mod_negotiation.c revision 5e657cb2e8af81202f9cb47de03fa9db5f0f22b9
/* Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
/*
 * mod_negotiation.c: keeps track of MIME types the client is willing to
 * accept, and contains code to handle type arbitration.
 *
 * rst
 */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb#include "apr.h"
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb#include "apr_strings.h"
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb#include "apr_file_io.h"
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb#include "apr_lib.h"
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb#define APR_WANT_STRFUNC
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb#include "apr_want.h"
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb#include "ap_config.h"
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb#include "httpd.h"
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb#include "http_config.h"
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb#include "http_request.h"
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb#include "http_protocol.h"
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb#include "http_core.h"
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb#include "http_log.h"
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb#include "util_script.h"
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
/* Magic content-type string for type-map files.  Where it is compared
 * against a request's type is outside this part of the file.
 */
#define MAP_FILE_MAGIC_TYPE "application/x-type-map"
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb/* Commands --- configuring document caching on a per (virtual?)
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * server basis...
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbbtypedef struct {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb int forcelangpriority;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb apr_array_header_t *language_priority;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb} neg_dir_config;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
/* forcelangpriority flags
 *
 * FLP_UNDEF is the "nothing set" value; the remaining flags occupy
 * distinct bits, and set_force_priority() ORs FLP_PREFER and
 * FLP_FALLBACK together.
 */
#define FLP_UNDEF    0    /* Same as FLP_DEFAULT, but base overrides */
#define FLP_NONE     1    /* Return 406, HTTP_NOT_ACCEPTABLE */
#define FLP_PREFER   2    /* Use language_priority rather than MC */
#define FLP_FALLBACK 4    /* Use language_priority rather than NA */

#define FLP_DEFAULT  FLP_PREFER
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
/* env evaluation
 *
 * Each value is annotated with the environment variable name it
 * corresponds to; the code that evaluates them is outside this part
 * of the file.
 */
#define DISCARD_ALL_ENCODINGS 1  /* no-gzip */
#define DISCARD_ALL_BUT_HTML  2  /* gzip-only-text/html */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbbmodule AP_MODULE_DECLARE_DATA negotiation_module;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
/* Allocate a fresh neg_dir_config from pool p.
 *
 * The record starts with forcelangpriority == FLP_UNDEF and no
 * language_priority array.  The second argument is not used.
 * Returns the new record.
 */
static void *create_neg_dir_config(apr_pool_t *p, char *dummy)
{
    neg_dir_config *conf = apr_palloc(p, sizeof(*conf));

    /* apr_palloc() is not relied on to zero memory: set every field. */
    conf->forcelangpriority = FLP_UNDEF;
    conf->language_priority = NULL;
    return conf;
}
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
/* Combine two neg_dir_config records into a new one allocated from p.
 *
 * basev is the base configuration and addv the overriding one.  For each
 * field the value from addv wins when it has been set (forcelangpriority
 * differs from FLP_UNDEF, language_priority is non-NULL); otherwise the
 * value from basev is carried over.  Neither input is modified.
 */
static void *merge_neg_dir_configs(apr_pool_t *p, void *basev, void *addv)
{
    const neg_dir_config *base = basev;
    const neg_dir_config *add = addv;
    neg_dir_config *merged = apr_palloc(p, sizeof(*merged));

    /* give priority to the config in the subdirectory */
    if (add->forcelangpriority != FLP_UNDEF) {
        merged->forcelangpriority = add->forcelangpriority;
    }
    else {
        merged->forcelangpriority = base->forcelangpriority;
    }

    /* The array pointer is shared with the chosen input, not copied. */
    if (add->language_priority) {
        merged->language_priority = add->language_priority;
    }
    else {
        merged->language_priority = base->language_priority;
    }

    return merged;
}
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
/* Handler for one LanguagePriority argument.
 *
 * n_ is the neg_dir_config being configured and lang the language name
 * to append.  The priority array is created from cmd->pool on first use.
 * The lang pointer itself is stored; the string is not copied.
 * Always returns NULL.
 *
 * NOTE(review): the directive is registered with AP_INIT_ITERATE, so this
 * is presumably invoked once per listed language -- confirm against the
 * httpd configuration API.
 */
static const char *set_language_priority(cmd_parms *cmd, void *n_,
                                         const char *lang)
{
    neg_dir_config *n = n_;
    const char **langp;

    if (!n->language_priority) {
        n->language_priority = apr_array_make(cmd->pool, 4, sizeof(char *));
    }

    langp = (const char **) apr_array_push(n->language_priority);
    *langp = lang;
    return NULL;
}
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe
/* Handler for one ForceLanguagePriority argument.
 *
 * n_ is the neg_dir_config being configured and w the option word,
 * matched case-insensitively:
 *   "None"     -- sets FLP_NONE; rejected if any other flag is already set
 *   "Prefer"   -- adds FLP_PREFER; rejected if FLP_NONE is already set
 *   "Fallback" -- adds FLP_FALLBACK; rejected if FLP_NONE is already set
 *
 * Returns NULL on success, otherwise an error message (a string literal,
 * or a string built in cmd->pool for an unrecognised word).
 */
static const char *set_force_priority(cmd_parms *cmd, void *n_, const char *w)
{
    neg_dir_config *n = n_;

    if (!strcasecmp(w, "None")) {
        /* Any bit other than FLP_NONE means Prefer/Fallback came first. */
        if (n->forcelangpriority & ~FLP_NONE) {
            return "Cannot combine ForceLanguagePriority options with None";
        }
        n->forcelangpriority = FLP_NONE;
    }
    else if (!strcasecmp(w, "Prefer")) {
        if (n->forcelangpriority & FLP_NONE) {
            return "Cannot combine ForceLanguagePriority options None and "
                   "Prefer";
        }
        n->forcelangpriority |= FLP_PREFER;
    }
    else if (!strcasecmp(w, "Fallback")) {
        if (n->forcelangpriority & FLP_NONE) {
            return "Cannot combine ForceLanguagePriority options None and "
                   "Fallback";
        }
        n->forcelangpriority |= FLP_FALLBACK;
    }
    else {
        return apr_pstrcat(cmd->pool, "Invalid ForceLanguagePriority option ",
                           w, NULL);
    }

    return NULL;
}
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowestatic const char *cache_negotiated_docs(cmd_parms *cmd, void *dummy,
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe int arg)
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe{
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe ap_set_module_config(cmd->server->module_config, &negotiation_module,
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe (arg ? "Cache" : NULL));
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe return NULL;
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe}
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowestatic int do_cache_negotiated_docs(server_rec *s)
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe{
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe return (ap_get_module_config(s->module_config,
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe &negotiation_module) != NULL);
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe}
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowestatic const command_rec negotiation_cmds[] =
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe{
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe AP_INIT_FLAG("CacheNegotiatedDocs", cache_negotiated_docs, NULL, RSRC_CONF,
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe "Either 'on' or 'off' (default)"),
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe AP_INIT_ITERATE("LanguagePriority", set_language_priority, NULL,
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe OR_FILEINFO,
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe "space-delimited list of MIME language abbreviations"),
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe AP_INIT_ITERATE("ForceLanguagePriority", set_force_priority, NULL,
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe OR_FILEINFO,
4775dfc34c90fada8c7c4d6a57ed8a3114d55c2dtrawick "Force LanguagePriority elections, either None, or "
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe "Fallback and/or Prefer"),
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe {NULL}
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe};
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe
/*
 * Record of available info on a media type specified by the client
 * (we also use 'em for encodings and languages)
 */

typedef struct accept_rec {
    char *name;                 /* MUST be lowercase */
    float quality;              /* q value; parsed entries start at 1.0 */
    float level;                /* media type level; parsed entries start at 0.0 */
    char *charset;              /* for content-type only */
} accept_rec;
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe/*
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * Record of available info on a particular variant
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe *
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * Note that a few of these fields are updated by the actual negotiation
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * code. These are:
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe *
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * level_matched --- initialized to zero. Set to the value of level
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * if the client actually accepts this media type at that
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * level (and *not* if it got in on a wildcard). See level_cmp
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * below.
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * mime_stars -- initialized to zero. Set to the number of stars
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * present in the best matching Accept header element.
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * 1 for star/star, 2 for type/star and 3 for
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * type/subtype.
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe *
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * definite -- initialized to 1. Set to 0 if there is a match which
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * makes the variant non-definite according to the rules
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * in rfc2296.
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowetypedef struct var_rec {
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe request_rec *sub_req; /* May be NULL (is, for map files) */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe const char *mime_type; /* MUST be lowercase */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe const char *file_name; /* Set to 'this' (for map file body content) */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe apr_off_t body; /* Only for map file body content */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe const char *content_encoding;
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe apr_array_header_t *content_languages; /* list of lang. for this variant */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe const char *content_charset;
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe const char *description;
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe /* The next five items give the quality values for the dimensions
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * of negotiation for this variant. They are obtained from the
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * appropriate header lines, except for source_quality, which
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * is obtained from the variant itself (the 'qs' parameter value
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * from the variant's mime-type). Apart from source_quality,
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * these values are set when we find the quality for each variant
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * (see best_match()). source_quality is set from the 'qs' parameter
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * of the variant description or mime type: see set_mime_fields().
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe float lang_quality; /* quality of this variant's language */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe float encoding_quality; /* ditto encoding */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe float charset_quality; /* ditto charset */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe float mime_type_quality; /* ditto media type */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe float source_quality; /* source quality for this variant */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe /* Now some special values */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe float level; /* Auxiliary to content-type... */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe apr_off_t bytes; /* content length, if known */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe int lang_index; /* Index into LanguagePriority list */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe int is_pseudo_html; /* text/html, *or* the INCLUDES_MAGIC_TYPEs */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe /* Above are all written-once properties of the variant. The
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * three fields below are changed during negotiation:
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe float level_matched;
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe int mime_stars;
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe int definite;
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe} var_rec;
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe/* Something to carry around the state of negotiation (and to keep
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * all of this thread-safe)...
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbbtypedef struct {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb apr_pool_t *pool;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb request_rec *r;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb neg_dir_config *conf;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb char *dir_name;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb int accept_q; /* 1 if an Accept item has a q= param */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb float default_lang_quality; /* fiddle lang q for variants with no lang */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb /* the array pointers below are NULL if the corresponding accept
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * headers are not present
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb apr_array_header_t *accepts; /* accept_recs */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb apr_array_header_t *accept_encodings; /* accept_recs */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb apr_array_header_t *accept_charsets; /* accept_recs */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb apr_array_header_t *accept_langs; /* accept_recs */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb apr_array_header_t *avail_vars; /* available variants */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb int count_multiviews_variants; /* number of variants found on disk */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb int is_transparent; /* 1 if this resource is trans. negotiable */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb int dont_fiddle_headers; /* 1 if we may not fiddle with accept hdrs */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb int ua_supports_trans; /* 1 if ua supports trans negotiation */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb int send_alternates; /* 1 if we want to send an Alternates header */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb int may_choose; /* 1 if we may choose a variant for the client */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb int use_rvsa; /* 1 if we must use RVSA/1.0 negotiation algo */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb} negotiation_state;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb/* A few functions to manipulate var_recs.
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * Cleaning out the fields...
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
c6ed63d53853f79bf8265c434d2e25c9db8a7fd8trawickstatic void clean_var_rec(var_rec *mime_info)
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe{
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->sub_req = NULL;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->mime_type = "";
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->file_name = "";
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->body = 0;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->content_encoding = NULL;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->content_languages = NULL;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->content_charset = "";
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->description = "";
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->is_pseudo_html = 0;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->level = 0.0f;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->level_matched = 0.0f;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->bytes = -1;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->lang_index = -1;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->mime_stars = 0;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->definite = 1;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->charset_quality = 1.0f;
2f1949bb0e3c209db94c8d521cba7380b9d11421trawick mime_info->encoding_quality = 1.0f;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->lang_quality = 1.0f;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->mime_type_quality = 1.0f;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info->source_quality = 0.0f;
2f1949bb0e3c209db94c8d521cba7380b9d11421trawick}
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe/* Initializing the relevant fields of a variant record from the
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * accept_info read out of its content-type, one way or another.
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe */
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowestatic void set_mime_fields(var_rec *var, accept_rec *mime_info)
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe{
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe var->mime_type = mime_info->name;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe var->source_quality = mime_info->quality;
2f1949bb0e3c209db94c8d521cba7380b9d11421trawick var->level = mime_info->level;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe var->content_charset = mime_info->charset;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe var->is_pseudo_html = (!strcmp(var->mime_type, "text/html")
2f1949bb0e3c209db94c8d521cba7380b9d11421trawick || !strcmp(var->mime_type, INCLUDES_MAGIC_TYPE)
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe || !strcmp(var->mime_type, INCLUDES_MAGIC_TYPE3));
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe}
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe/* Create a variant list validator in r using info from vlistr. */
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowestatic void set_vlist_validator(request_rec *r, request_rec *vlistr)
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe{
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe /* Calculating the variant list validator is similar to
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * calculating an etag for the source of the variant list
c6ed63d53853f79bf8265c434d2e25c9db8a7fd8trawick * information, so we use ap_make_etag(). Note that this
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * validator can be 'weak' in extreme case.
8aefbd756763807188d2e3ce336a8680e4893066wrowe */
8aefbd756763807188d2e3ce336a8680e4893066wrowe ap_update_mtime(vlistr, vlistr->finfo.mtime);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb r->vlist_validator = ap_make_etag(vlistr, 0);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb /* ap_set_etag will later take r->vlist_validator into account
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * when creating the etag header
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb}
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
/*****************************************************************
 *
 * Parsing (lists of) media types and their parameters, as seen in
 * HTTP header lines and elsewhere.
 */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
/*
 * parse quality value. atof(3) is not well-usable here, because it
 * depends on the locale (argh).
 *
 * However, RFC 2616 states:
 *  3.9 Quality Values
 *
 *  [...] HTTP/1.1 applications MUST NOT generate more than three digits
 *  after the decimal point. User configuration of these values SHOULD also
 *  be limited in this fashion.
 *
 *     qvalue         = ( "0" [ "." 0*3DIGIT ] )
 *                    | ( "1" [ "." 0*3("0") ] )
 *
 * This is quite easy. If the supplied string doesn't match the above
 * definition (loosely), we simply return 1 (same as if there's no qvalue)
 *
 * Behaviour in detail:
 *   - NULL or empty input returns 1.0.
 *   - Leading whitespace is skipped.
 *   - Anything that does not start with '0' or '.' returns 1.0.
 *   - "0" not followed by '.' returns 0.0.
 *   - After the '.', up to three leading digits are read as thousandths;
 *     anything after them is ignored.
 */

static float atoq(const char *string)
{
    /* Weight of the 1st, 2nd and 3rd digit after the decimal point. */
    static const int weight[3] = { 100, 10, 1 };
    int thousandths = 0;
    int pos;

    if (!string || !*string) {
        return 1.0f;
    }

    while (*string && apr_isspace(*string)) {
        ++string;
    }

    /* be tolerant and accept qvalues without leading zero
     * (also for backwards compat, where atof() was in use)
     */
    if (*string != '.') {
        if (*string != '0') {
            return 1.0f;
        }
        ++string;
        if (*string != '.') {
            return 0.0f;
        }
    }

    /* Step over the '.' and accumulate an integer: one division at the
     * end avoids repeated inexact 0.1 factors in floating point.
     */
    ++string;
    for (pos = 0;
         pos < 3 && string[pos] >= '0' && string[pos] <= '9';
         ++pos) {
        thousandths += (string[pos] - '0') * weight[pos];
    }

    return (float)thousandths / 1000.0f;
}
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb/*
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * Get a single mime type entry --- one media type and parameters;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * enter the values we recognize into the argument accept_rec
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
4ca6cbe768b4e0917ac0b76333c26a7d5396d454trawickstatic const char *get_entry(apr_pool_t *p, accept_rec *result,
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb const char *accept_line)
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb{
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb result->quality = 1.0f;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb result->level = 0.0f;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb result->charset = "";
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb /*
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * Note that this handles what I gather is the "old format",
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb *
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * Accept: text/html text/plain moo/zot
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb *
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * without any compatibility kludges --- if the token after the
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * MIME type begins with a semicolon, we know we're looking at parms,
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * otherwise, we know we aren't. (So why all the pissing and moaning
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * in the CERN server code? I must be missing something).
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb result->name = ap_get_token(p, &accept_line, 0);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb ap_str_tolower(result->name); /* You want case insensitive,
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * you'll *get* case insensitive.
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb /* KLUDGE!!! Default HTML to level 2.0 unless the browser
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * *explicitly* says something else.
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (!strcmp(result->name, "text/html") && (result->level == 0.0)) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb result->level = 2.0f;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb else if (!strcmp(result->name, INCLUDES_MAGIC_TYPE)) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb result->level = 2.0f;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb else if (!strcmp(result->name, INCLUDES_MAGIC_TYPE3)) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb result->level = 3.0f;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb while (*accept_line == ';') {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb /* Parameters ... */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb char *parm;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb char *cp;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb char *end;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb ++accept_line;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb parm = ap_get_token(p, &accept_line, 1);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb /* Look for 'var = value' --- and make sure the var is in lcase. */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb for (cp = parm; (*cp && !apr_isspace(*cp) && *cp != '='); ++cp) {
b29f87f4b6c6886a04dccc296177a7033f70dfedtrawick *cp = apr_tolower(*cp);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (!*cp) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb continue; /* No '='; just ignore it. */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb *cp++ = '\0'; /* Delimit var */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb while (*cp && (apr_isspace(*cp) || *cp == '=')) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb ++cp;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (*cp == '"') {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb ++cp;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb for (end = cp;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb (*end && *end != '\n' && *end != '\r' && *end != '\"');
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb end++);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb else {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb for (end = cp; (*end && !apr_isspace(*end)); end++);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (*end) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb *end = '\0'; /* strip ending quote or return */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb ap_str_tolower(cp);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (parm[0] == 'q'
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb && (parm[1] == '\0' || (parm[1] == 's' && parm[2] == '\0'))) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb result->quality = atoq(cp);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb else if (parm[0] == 'l' && !strcmp(&parm[1], "evel")) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb result->level = (float)atoi(cp);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb else if (!strcmp(parm, "charset")) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb result->charset = cp;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (*accept_line == ',') {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb ++accept_line;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb return accept_line;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb}
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb/*****************************************************************
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb *
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * Dealing with header lines ...
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb *
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe * Accept, Accept-Charset, Accept-Language and Accept-Encoding
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * are handled by do_header_line() - they all have the same
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * basic structure of a list of items of the format
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * name; q=N; charset=TEXT
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb *
2fa5b5878e7567e2875807c3e2a2b3b0d3ef74bewrowe * where charset is only valid in Accept.
2fa5b5878e7567e2875807c3e2a2b3b0d3ef74bewrowe */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbbstatic apr_array_header_t *do_header_line(apr_pool_t *p,
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb const char *accept_line)
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb{
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb apr_array_header_t *accept_recs;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (!accept_line) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb return NULL;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe accept_recs = apr_array_make(p, 40, sizeof(accept_rec));
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe while (*accept_line) {
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe accept_rec *new = (accept_rec *) apr_array_push(accept_recs);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb accept_line = get_entry(p, new, accept_line);
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe }
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe return accept_recs;
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe}
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe/* Given the text of the Content-Languages: line from the var map file,
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * return an array containing the languages of this variant
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbbstatic apr_array_header_t *do_languages_line(apr_pool_t *p,
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb const char **lang_line)
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb{
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb apr_array_header_t *lang_recs = apr_array_make(p, 2, sizeof(char *));
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (!lang_line) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb return lang_recs;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb while (**lang_line) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb char **new = (char **) apr_array_push(lang_recs);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb *new = ap_get_token(p, lang_line, 0);
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe ap_str_tolower(*new);
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe if (**lang_line == ',' || **lang_line == ';') {
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe ++(*lang_line);
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe }
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe }
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe return lang_recs;
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe}
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe/*****************************************************************
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe *
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * Handling header lines from clients...
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe */
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowestatic negotiation_state *parse_accept_headers(request_rec *r)
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe{
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe negotiation_state *new =
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe (negotiation_state *) apr_pcalloc(r->pool, sizeof(negotiation_state));
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe accept_rec *elts;
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe apr_table_t *hdrs = r->headers_in;
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe int i;
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe new->pool = r->pool;
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe new->r = r;
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe new->conf = (neg_dir_config *)ap_get_module_config(r->per_dir_config,
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe &negotiation_module);
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe new->dir_name = ap_make_dirstr_parent(r->pool, r->filename);
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe new->accepts = do_header_line(r->pool, apr_table_get(hdrs, "Accept"));
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe /* calculate new->accept_q value */
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe if (new->accepts) {
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe elts = (accept_rec *) new->accepts->elts;
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe for (i = 0; i < new->accepts->nelts; ++i) {
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe if (elts[i].quality < 1.0) {
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe new->accept_q = 1;
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe }
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe }
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe }
580786e253bbe2fa462fdb24af47e52e1ef3dd83wrowe
580786e253bbe2fa462fdb24af47e52e1ef3dd83wrowe new->accept_encodings =
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe do_header_line(r->pool, apr_table_get(hdrs, "Accept-Encoding"));
6fed20de38221f6f8a60c0ab1d907f1173c443f4wrowe new->accept_langs =
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb do_header_line(r->pool, apr_table_get(hdrs, "Accept-Language"));
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb new->accept_charsets =
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb do_header_line(r->pool, apr_table_get(hdrs, "Accept-Charset"));
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb /* This is possibly overkill for some servers, heck, we have
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * only 33 index.html variants in docs/docroot (today).
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * Make this configurable?
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb new->avail_vars = apr_array_make(r->pool, 40, sizeof(var_rec));
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb return new;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb}
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
/*
 * Configure the negotiation flags in neg from the request's Negotiate
 * header.
 *
 * Without the header, the defaults are: no transparent negotiation, no
 * Alternates header, the server may choose, and the original Apache
 * algorithm with header fiddles is used.  Alternates is off by default
 * to save bandwidth; agents that want it must send a suitable Negotiate
 * header.
 */
static void parse_negotiate_header(request_rec *r, negotiation_state *neg)
{
    const char *negotiate = apr_table_get(r->headers_in, "Negotiate");
    char *tok;

    neg->may_choose = 1;
    neg->ua_supports_trans = 0;
    neg->send_alternates = 0;
    neg->use_rvsa = 0;
    neg->dont_fiddle_headers = 0;

    if (negotiate == NULL) {
        return;
    }

    if (strcmp(negotiate, "trans") == 0) {
        /* Lynx 2.7 and 2.8 send 'negotiate: trans' without actually
         * supporting transparent content negotiation, so a header that
         * is exactly "trans" is ignored for Lynx.  A future Lynx that
         * really means it can send 'negotiate: trans, trans' to avoid
         * this workaround.
         */
        const char *ua = apr_table_get(r->headers_in, "User-Agent");

        if (ua != NULL && strncmp(ua, "Lynx", 4) == 0) {
            return;
        }
    }

    /* An empty Negotiate would require a 300 response */
    neg->may_choose = 0;

    while ((tok = ap_get_list_item(neg->pool, &negotiate)) != NULL) {
        int transparent = apr_isdigit(tok[0])
                          || strcmp(tok, "trans") == 0
                          || strcmp(tok, "vlist") == 0
                          || strcmp(tok, "guess-small") == 0
                          || strcmp(tok, "*") == 0;

        if (!transparent) {
            continue;           /* unrecognised directive */
        }

        /* The user agent supports transparent negotiation */
        neg->ua_supports_trans = 1;

        /* Sending Alternates could be made configurable, but it has to
         * be 1 whenever 'vlist' is in the Negotiate header.
         */
        neg->send_alternates = 1;

        if (strcmp(tok, "1.0") == 0) {
            /* RVSA/1.0 is allowed: configure for it */
            neg->may_choose = 1;
            neg->use_rvsa = 1;
            neg->dont_fiddle_headers = 1;
        }
        else if (tok[0] == '*') {
            /* Any variant selection algorithm is allowed: use Apache's
             * own.  Header fiddles are turned off on the assumption
             * that a client sending Negotiate sends correct headers.
             */
            neg->may_choose = 1;
            neg->dont_fiddle_headers = 1;
        }
    }

#ifdef NEG_DEBUG
    ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL, APLOGNO(00680)
            "dont_fiddle_headers=%d use_rvsa=%d ua_supports_trans=%d "
            "send_alternates=%d, may_choose=%d",
            neg->dont_fiddle_headers, neg->use_rvsa,
            neg->ua_supports_trans, neg->send_alternates, neg->may_choose);
#endif

}
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb/* Sometimes clients will give us no Accept info at all; this routine sets
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * up the standard default for that case, and also arranges for us to be
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * willing to run a CGI script if we find one. (In fact, we set up to
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * dramatically prefer CGI scripts in cases where that's appropriate,
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * e.g., POST or when URI includes query args or extra path info).
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
/*
 * Make sure neg->accepts exists and append an entry for CGI scripts.
 *
 * neg            - negotiation state whose accepts array is extended
 * prefer_scripts - non-zero to rank the CGI entry above everything else
 *
 * When the client sent no Accept information, a catch-all entry with
 * quality 1.0 is created first.  The CGI entry gets quality 0 when the
 * RVSA algorithm is in use, otherwise 2.0 or 0.001 depending on
 * prefer_scripts.
 */
static void maybe_add_default_accepts(negotiation_state *neg,
                                      int prefer_scripts)
{
    accept_rec *rec;

    if (neg->accepts == NULL) {
        neg->accepts = apr_array_make(neg->pool, 4, sizeof(accept_rec));

        rec = (accept_rec *) apr_array_push(neg->accepts);
        rec->level = 0.0f;
        rec->quality = 1.0f;
        rec->name = "*/*";
    }

    rec = (accept_rec *) apr_array_push(neg->accepts);
    rec->name = CGI_MAGIC_TYPE;
    rec->level = 0.0f;

    if (!neg->use_rvsa) {
        rec->quality = prefer_scripts ? 2.0f : 0.001f;
    }
    else {
        rec->quality = 0;
    }
}
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe/*****************************************************************
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb *
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * Parsing type-map files, in Roy's meta/http format augmented with
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * #-comments.
2fa5b5878e7567e2875807c3e2a2b3b0d3ef74bewrowe */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb/* Reading RFC822-style header lines, ignoring #-comments and
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe * handling continuations.
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe */
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe
/* Result of one get_header_line() call. */
enum header_state {
    header_eof,     /* nothing more could be read from the map file */
    header_seen,    /* a header line is available in the buffer */
    header_sep      /* a blank line was read */
};
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe
/*
 * Read one logical header line from a type-map file into buffer,
 * skipping '#' comment lines and folding continuation lines (lines
 * starting with whitespace) onto the end of the header.
 *
 * buffer - destination for the line
 * len    - capacity of buffer in bytes
 * map    - open type-map file, positioned at the start of a line
 *
 * Returns header_eof when no line could be read, header_sep when the
 * line read is blank, and header_seen otherwise.
 */
static enum header_state get_header_line(char *buffer, int len, apr_file_t *map)
{
    char *buf_end = buffer + len;
    char *cp;
    char c;

    /* Get a noncommented line.  The read is bounded by the caller's
     * buffer size rather than by a fixed constant.
     */

    do {
        if (apr_file_gets(buffer, len, map) != APR_SUCCESS) {
            return header_eof;
        }
    } while (buffer[0] == '#');

    /* If blank, just return it --- this ends information on this variant */

    for (cp = buffer; (*cp && apr_isspace(*cp)); ++cp) {
        continue;
    }

    if (*cp == '\0') {
        return header_sep;
    }

    /* If non-blank, go looking for header lines, but note that we still
     * have to treat comments specially...
     */

    cp += strlen(cp);

    /* We need to shortcut the rest of this block following the Body:
     * tag - we will not look for continuation after this line.
     */
    if (!strncasecmp(buffer, "Body:", 5))
        return header_seen;

    /* Stop on any read failure, not only on EOF, so that c is never
     * examined after a failed read.
     */
    while (apr_file_getc(&c, map) == APR_SUCCESS) {
        if (c == '#') {
            /* Comment line */
            while (apr_file_getc(&c, map) == APR_SUCCESS && c != '\n') {
                continue;
            }
        }
        else if (apr_isspace(c)) {
            /* Leading whitespace.  POSSIBLE continuation line
             * Also, possibly blank --- if so, we ungetc() the final newline
             * so that we will pick up the blank line the next time 'round.
             */

            while (c != '\n' && apr_isspace(c)) {
                if (apr_file_getc(&c, map) != APR_SUCCESS)
                    break;
            }

            apr_file_ungetc(c, map);

            if (c == '\n') {
                return header_seen;     /* Blank line */
            }

            /* Continuation: append it while leaving room for the
             * trailing "\n\0".  NOTE(review): when the buffer fills up
             * the remainder of the continuation line is left unread.
             */

            while (   cp < buf_end - 2
                   && apr_file_getc(&c, map) == APR_SUCCESS
                   && c != '\n') {
                *cp++ = c;
            }

            /* If the first line already filled the buffer there is no
             * room for the terminator pair; the existing '\0' stays.
             */
            if (cp < buf_end - 1) {
                *cp++ = '\n';
                *cp = '\0';
            }
        }
        else {

            /* Line beginning with something other than whitespace */

            apr_file_ungetc(c, map);
            return header_seen;
        }
    }

    return header_seen;
}
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowestatic apr_off_t get_body(char *buffer, apr_size_t *len, const char *tag,
8aefbd756763807188d2e3ce336a8680e4893066wrowe apr_file_t *map)
8aefbd756763807188d2e3ce336a8680e4893066wrowe{
8aefbd756763807188d2e3ce336a8680e4893066wrowe char *endbody;
8aefbd756763807188d2e3ce336a8680e4893066wrowe int bodylen;
8aefbd756763807188d2e3ce336a8680e4893066wrowe int taglen;
8aefbd756763807188d2e3ce336a8680e4893066wrowe apr_off_t pos;
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe taglen = strlen(tag);
8aefbd756763807188d2e3ce336a8680e4893066wrowe *len -= taglen;
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe /* We are at the first character following a body:tag\n entry
8aefbd756763807188d2e3ce336a8680e4893066wrowe * Suck in the body, then backspace to the first char after the
8aefbd756763807188d2e3ce336a8680e4893066wrowe * closing tag entry. If we fail to read, find the tag or back
8aefbd756763807188d2e3ce336a8680e4893066wrowe * up then we have a hosed file, so give up already
8aefbd756763807188d2e3ce336a8680e4893066wrowe */
8aefbd756763807188d2e3ce336a8680e4893066wrowe if (apr_file_read(map, buffer, len) != APR_SUCCESS) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe return -1;
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
4fca95918a9c0ae93593806544b425d0adc2fcc3wrowe
4fca95918a9c0ae93593806544b425d0adc2fcc3wrowe /* put a copy of the tag *after* the data read from the file
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe * so that strstr() will find something with no reliance on
a8d11d78181478da6a672f7fbc58b8d523351f49wrowe * terminating '\0'
a8d11d78181478da6a672f7fbc58b8d523351f49wrowe */
a8d11d78181478da6a672f7fbc58b8d523351f49wrowe memcpy(buffer + *len, tag, taglen);
a8d11d78181478da6a672f7fbc58b8d523351f49wrowe endbody = strstr(buffer, tag);
a8d11d78181478da6a672f7fbc58b8d523351f49wrowe if (endbody == buffer + *len) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe return -1;
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe bodylen = endbody - buffer;
8aefbd756763807188d2e3ce336a8680e4893066wrowe endbody += taglen;
2fa5b5878e7567e2875807c3e2a2b3b0d3ef74bewrowe /* Skip all the trailing cruft after the end tag to the next line */
8aefbd756763807188d2e3ce336a8680e4893066wrowe while (*endbody) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe if (*endbody == '\n') {
d11e96111ae8731e8785837b4c927d81bf33c9b6wrowe ++endbody;
2fa5b5878e7567e2875807c3e2a2b3b0d3ef74bewrowe break;
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe ++endbody;
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe pos = -(apr_off_t)(*len - (endbody - buffer));
8aefbd756763807188d2e3ce336a8680e4893066wrowe if (apr_file_seek(map, APR_CUR, &pos) != APR_SUCCESS) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe return -1;
d11e96111ae8731e8785837b4c927d81bf33c9b6wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe /* Give the caller back the actual body's file offset and length */
8aefbd756763807188d2e3ce336a8680e4893066wrowe *len = bodylen;
8aefbd756763807188d2e3ce336a8680e4893066wrowe return pos - (endbody - buffer);
8aefbd756763807188d2e3ce336a8680e4893066wrowe}
2fa5b5878e7567e2875807c3e2a2b3b0d3ef74bewrowe
4fca95918a9c0ae93593806544b425d0adc2fcc3wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe/* Stripping out RFC822 comments */
2fa5b5878e7567e2875807c3e2a2b3b0d3ef74bewrowe
/*
 * Blank out RFC822-style "(comment)" spans in hdr, in place.
 *
 * Every character of a comment, parentheses included, is overwritten
 * with a space so the string keeps its length.  Text between double
 * quotes is left untouched.  If a quoted string is never closed,
 * processing stops at its opening quote.
 *
 * Known limitations: nested comments and backslash escapes are not
 * handled.
 */
static void strip_paren_comments(char *hdr)
{
    while (*hdr) {
        if (*hdr == '"') {
            /* Look for the closing quote starting after the opening
             * one; searching from hdr itself would just find the
             * opening quote again.
             */
            hdr = strchr(hdr + 1, '"');
            if (hdr == NULL) {
                return;
            }
            ++hdr;
        }
        else if (*hdr == '(') {
            while (*hdr && *hdr != ')') {
                *hdr++ = ' ';
            }

            /* Blank the closing ')' too, if there is one */
            if (*hdr) {
                *hdr++ = ' ';
            }
        }
        else {
            ++hdr;
        }
    }
}
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe/* Getting to a header body from the header */
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowestatic char *lcase_header_name_return_body(char *header, request_rec *r)
8aefbd756763807188d2e3ce336a8680e4893066wrowe{
8aefbd756763807188d2e3ce336a8680e4893066wrowe char *cp = header;
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe for ( ; *cp && *cp != ':' ; ++cp) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe *cp = apr_tolower(*cp);
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe if (!*cp) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe ap_log_rerror(APLOG_MARK, APLOG_ERR, 0, r, APLOGNO(00681)
8aefbd756763807188d2e3ce336a8680e4893066wrowe "Syntax error in type map, no ':' in %s for header %s",
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe r->filename, header);
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe return NULL;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe }
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe do {
8aefbd756763807188d2e3ce336a8680e4893066wrowe ++cp;
8aefbd756763807188d2e3ce336a8680e4893066wrowe } while (*cp && apr_isspace(*cp));
8aefbd756763807188d2e3ce336a8680e4893066wrowe
d11e96111ae8731e8785837b4c927d81bf33c9b6wrowe if (!*cp) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe ap_log_rerror(APLOG_MARK, APLOG_ERR, 0, r, APLOGNO(00682)
8aefbd756763807188d2e3ce336a8680e4893066wrowe "Syntax error in type map --- no header body: %s for %s",
8aefbd756763807188d2e3ce336a8680e4893066wrowe r->filename, header);
8aefbd756763807188d2e3ce336a8680e4893066wrowe return NULL;
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe return cp;
8aefbd756763807188d2e3ce336a8680e4893066wrowe}
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowestatic int read_type_map(apr_file_t **map, negotiation_state *neg,
8aefbd756763807188d2e3ce336a8680e4893066wrowe request_rec *rr)
8aefbd756763807188d2e3ce336a8680e4893066wrowe{
8aefbd756763807188d2e3ce336a8680e4893066wrowe request_rec *r = neg->r;
8aefbd756763807188d2e3ce336a8680e4893066wrowe apr_file_t *map_ = NULL;
8aefbd756763807188d2e3ce336a8680e4893066wrowe apr_status_t status;
8aefbd756763807188d2e3ce336a8680e4893066wrowe char buffer[MAX_STRING_LEN];
8aefbd756763807188d2e3ce336a8680e4893066wrowe enum header_state hstate;
8aefbd756763807188d2e3ce336a8680e4893066wrowe struct var_rec mime_info;
8aefbd756763807188d2e3ce336a8680e4893066wrowe int has_content;
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe if (!map)
8aefbd756763807188d2e3ce336a8680e4893066wrowe map = &map_;
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe /* We are not using multiviews */
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe neg->count_multiviews_variants = 0;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe if ((status = apr_file_open(map, rr->filename, APR_READ | APR_BUFFERED,
8aefbd756763807188d2e3ce336a8680e4893066wrowe APR_OS_DEFAULT, neg->pool)) != APR_SUCCESS) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe ap_log_rerror(APLOG_MARK, APLOG_ERR, status, r, APLOGNO(00683)
8aefbd756763807188d2e3ce336a8680e4893066wrowe "cannot access type map file: %s", rr->filename);
8aefbd756763807188d2e3ce336a8680e4893066wrowe if (APR_STATUS_IS_ENOTDIR(status) || APR_STATUS_IS_ENOENT(status)) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe return HTTP_NOT_FOUND;
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe else {
8aefbd756763807188d2e3ce336a8680e4893066wrowe return HTTP_FORBIDDEN;
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe clean_var_rec(&mime_info);
8aefbd756763807188d2e3ce336a8680e4893066wrowe has_content = 0;
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe do {
8aefbd756763807188d2e3ce336a8680e4893066wrowe hstate = get_header_line(buffer, MAX_STRING_LEN, *map);
b29f87f4b6c6886a04dccc296177a7033f70dfedtrawick
8aefbd756763807188d2e3ce336a8680e4893066wrowe if (hstate == header_seen) {
b29f87f4b6c6886a04dccc296177a7033f70dfedtrawick char *body1 = lcase_header_name_return_body(buffer, neg->r);
8aefbd756763807188d2e3ce336a8680e4893066wrowe const char *body;
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe if (body1 == NULL) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe return HTTP_INTERNAL_SERVER_ERROR;
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe strip_paren_comments(body1);
8aefbd756763807188d2e3ce336a8680e4893066wrowe body = body1;
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe if (!strncmp(buffer, "uri:", 4)) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe mime_info.file_name = ap_get_token(neg->pool, &body, 0);
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe }
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe else if (!strncmp(buffer, "content-type:", 13)) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe struct accept_rec accept_info;
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe get_entry(neg->pool, &accept_info, body);
8aefbd756763807188d2e3ce336a8680e4893066wrowe set_mime_fields(&mime_info, &accept_info);
8aefbd756763807188d2e3ce336a8680e4893066wrowe has_content = 1;
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe else if (!strncmp(buffer, "content-length:", 15)) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe char *errp;
8aefbd756763807188d2e3ce336a8680e4893066wrowe apr_off_t number;
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe body1 = ap_get_token(neg->pool, &body, 0);
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe if (apr_strtoff(&number, body1, &errp, 10) != APR_SUCCESS
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe || *errp || number < 0) {
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe ap_log_rerror(APLOG_MARK, APLOG_ERR, 0, r, APLOGNO(00684)
8aefbd756763807188d2e3ce336a8680e4893066wrowe "Parse error in type map, Content-Length: "
8aefbd756763807188d2e3ce336a8680e4893066wrowe "'%s' in %s is invalid.",
8aefbd756763807188d2e3ce336a8680e4893066wrowe body1, r->filename);
8aefbd756763807188d2e3ce336a8680e4893066wrowe break;
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe mime_info.bytes = number;
8aefbd756763807188d2e3ce336a8680e4893066wrowe has_content = 1;
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe else if (!strncmp(buffer, "content-language:", 17)) {
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe mime_info.content_languages = do_languages_line(neg->pool,
8aefbd756763807188d2e3ce336a8680e4893066wrowe &body);
8aefbd756763807188d2e3ce336a8680e4893066wrowe has_content = 1;
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe else if (!strncmp(buffer, "content-encoding:", 17)) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe mime_info.content_encoding = ap_get_token(neg->pool, &body, 0);
8aefbd756763807188d2e3ce336a8680e4893066wrowe has_content = 1;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe }
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe else if (!strncmp(buffer, "description:", 12)) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe char *desc = apr_pstrdup(neg->pool, body);
8aefbd756763807188d2e3ce336a8680e4893066wrowe char *cp;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe for (cp = desc; *cp; ++cp) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe if (*cp=='\n') *cp=' ';
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe if (cp>desc) *(cp-1)=0;
8aefbd756763807188d2e3ce336a8680e4893066wrowe mime_info.description = desc;
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe else if (!strncmp(buffer, "body:", 5)) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe char *tag = apr_pstrdup(neg->pool, body);
8aefbd756763807188d2e3ce336a8680e4893066wrowe char *eol = strchr(tag, '\0');
8aefbd756763807188d2e3ce336a8680e4893066wrowe apr_size_t len = MAX_STRING_LEN;
8aefbd756763807188d2e3ce336a8680e4893066wrowe while (--eol >= tag && apr_isspace(*eol))
8aefbd756763807188d2e3ce336a8680e4893066wrowe *eol = '\0';
8aefbd756763807188d2e3ce336a8680e4893066wrowe if ((mime_info.body = get_body(buffer, &len, tag, *map)) < 0) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe ap_log_rerror(APLOG_MARK, APLOG_ERR, 0, r, APLOGNO(00685)
8aefbd756763807188d2e3ce336a8680e4893066wrowe "Syntax error in type map, no end tag '%s'"
8aefbd756763807188d2e3ce336a8680e4893066wrowe "found in %s for Body: content.",
8aefbd756763807188d2e3ce336a8680e4893066wrowe tag, r->filename);
8aefbd756763807188d2e3ce336a8680e4893066wrowe break;
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe mime_info.bytes = len;
8aefbd756763807188d2e3ce336a8680e4893066wrowe mime_info.file_name = apr_filepath_name_get(rr->filename);
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe }
8aefbd756763807188d2e3ce336a8680e4893066wrowe }
2fa5b5878e7567e2875807c3e2a2b3b0d3ef74bewrowe else {
8aefbd756763807188d2e3ce336a8680e4893066wrowe if (*mime_info.file_name && has_content) {
2fa5b5878e7567e2875807c3e2a2b3b0d3ef74bewrowe void *new_var = apr_array_push(neg->avail_vars);
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe memcpy(new_var, (void *) &mime_info, sizeof(var_rec));
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe }
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe clean_var_rec(&mime_info);
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe has_content = 0;
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe }
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe } while (hstate != header_eof);
ac06e54654494445fd3d39e90bd23b436b4f84ccwrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe if (map_)
8aefbd756763807188d2e3ce336a8680e4893066wrowe apr_file_close(map_);
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe set_vlist_validator(r, rr);
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe return OK;
8aefbd756763807188d2e3ce336a8680e4893066wrowe}
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe/* Sort function used by read_types_multi. */
8aefbd756763807188d2e3ce336a8680e4893066wrowestatic int variantsortf(var_rec *a, var_rec *b) {
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe /* First key is the source quality, sort in descending order. */
8aefbd756763807188d2e3ce336a8680e4893066wrowe
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe /* XXX: note that we currently implement no method of setting the
8aefbd756763807188d2e3ce336a8680e4893066wrowe * source quality for multiviews variants, so we are always comparing
8aefbd756763807188d2e3ce336a8680e4893066wrowe * 1.0 to 1.0 for now
8aefbd756763807188d2e3ce336a8680e4893066wrowe */
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe if (a->source_quality < b->source_quality)
8aefbd756763807188d2e3ce336a8680e4893066wrowe return 1;
8aefbd756763807188d2e3ce336a8680e4893066wrowe if (a->source_quality > b->source_quality)
8aefbd756763807188d2e3ce336a8680e4893066wrowe return -1;
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowe /* Second key is the variant name */
8aefbd756763807188d2e3ce336a8680e4893066wrowe return strcmp(a->file_name, b->file_name);
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe}
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe/*****************************************************************
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe *
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe * Same as read_type_map, except we use a filtered directory listing
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe * as the map...
8aefbd756763807188d2e3ce336a8680e4893066wrowe */
8aefbd756763807188d2e3ce336a8680e4893066wrowe
8aefbd756763807188d2e3ce336a8680e4893066wrowestatic int read_types_multi(negotiation_state *neg)
8aefbd756763807188d2e3ce336a8680e4893066wrowe{
8aefbd756763807188d2e3ce336a8680e4893066wrowe request_rec *r = neg->r;
948096a99010fccf648814fecf38f75c689172d7wrowe
948096a99010fccf648814fecf38f75c689172d7wrowe char *filp;
948096a99010fccf648814fecf38f75c689172d7wrowe int prefix_len;
948096a99010fccf648814fecf38f75c689172d7wrowe apr_dir_t *dirp;
948096a99010fccf648814fecf38f75c689172d7wrowe apr_finfo_t dirent;
948096a99010fccf648814fecf38f75c689172d7wrowe apr_status_t status;
948096a99010fccf648814fecf38f75c689172d7wrowe struct var_rec mime_info;
948096a99010fccf648814fecf38f75c689172d7wrowe struct accept_rec accept_info;
948096a99010fccf648814fecf38f75c689172d7wrowe void *new_var;
948096a99010fccf648814fecf38f75c689172d7wrowe int anymatch = 0;
948096a99010fccf648814fecf38f75c689172d7wrowe
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe clean_var_rec(&mime_info);
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (r->proxyreq || !r->filename
948096a99010fccf648814fecf38f75c689172d7wrowe || !ap_os_is_path_absolute(neg->pool, r->filename)) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb return DECLINED;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
053497224246c4dbef9af594cacf5c00ed271e6cwrowe
948096a99010fccf648814fecf38f75c689172d7wrowe /* Only absolute paths here */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (!(filp = strrchr(r->filename, '/'))) {
948096a99010fccf648814fecf38f75c689172d7wrowe return DECLINED;
948096a99010fccf648814fecf38f75c689172d7wrowe }
948096a99010fccf648814fecf38f75c689172d7wrowe ++filp;
948096a99010fccf648814fecf38f75c689172d7wrowe prefix_len = strlen(filp);
948096a99010fccf648814fecf38f75c689172d7wrowe
948096a99010fccf648814fecf38f75c689172d7wrowe if ((status = apr_dir_open(&dirp, neg->dir_name,
948096a99010fccf648814fecf38f75c689172d7wrowe neg->pool)) != APR_SUCCESS) {
948096a99010fccf648814fecf38f75c689172d7wrowe ap_log_rerror(APLOG_MARK, APLOG_ERR, status, r, APLOGNO(00686)
948096a99010fccf648814fecf38f75c689172d7wrowe "cannot read directory for multi: %s", neg->dir_name);
948096a99010fccf648814fecf38f75c689172d7wrowe return HTTP_FORBIDDEN;
948096a99010fccf648814fecf38f75c689172d7wrowe }
948096a99010fccf648814fecf38f75c689172d7wrowe
948096a99010fccf648814fecf38f75c689172d7wrowe while (apr_dir_read(&dirent, APR_FINFO_DIRENT, dirp) == APR_SUCCESS) {
948096a99010fccf648814fecf38f75c689172d7wrowe apr_array_header_t *exception_list;
948096a99010fccf648814fecf38f75c689172d7wrowe request_rec *sub_req;
948096a99010fccf648814fecf38f75c689172d7wrowe
948096a99010fccf648814fecf38f75c689172d7wrowe /* Do we have a match? */
948096a99010fccf648814fecf38f75c689172d7wrowe#ifdef CASE_BLIND_FILESYSTEM
948096a99010fccf648814fecf38f75c689172d7wrowe if (strncasecmp(dirent.name, filp, prefix_len)) {
948096a99010fccf648814fecf38f75c689172d7wrowe#else
948096a99010fccf648814fecf38f75c689172d7wrowe if (strncmp(dirent.name, filp, prefix_len)) {
948096a99010fccf648814fecf38f75c689172d7wrowe#endif
948096a99010fccf648814fecf38f75c689172d7wrowe continue;
948096a99010fccf648814fecf38f75c689172d7wrowe }
948096a99010fccf648814fecf38f75c689172d7wrowe if (dirent.name[prefix_len] != '.') {
948096a99010fccf648814fecf38f75c689172d7wrowe continue;
948096a99010fccf648814fecf38f75c689172d7wrowe }
948096a99010fccf648814fecf38f75c689172d7wrowe
948096a99010fccf648814fecf38f75c689172d7wrowe /* Don't negotiate directories and other unusual files
948096a99010fccf648814fecf38f75c689172d7wrowe * Really shouldn't see anything but DIR/LNK/REG here,
948096a99010fccf648814fecf38f75c689172d7wrowe * and we aught to discover if the LNK was interesting.
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb *
3f5b4558f5410fdac5d6feed7aab0c3668f9cd13wrowe * Of course, this only helps platforms that capture the
3f5b4558f5410fdac5d6feed7aab0c3668f9cd13wrowe * the filetype in apr_dir_read(), which most can once
3f5b4558f5410fdac5d6feed7aab0c3668f9cd13wrowe * they are optimized with some magic [it's known to the
3f5b4558f5410fdac5d6feed7aab0c3668f9cd13wrowe * dirent, not associated to the inode, on most FS's.]
3f5b4558f5410fdac5d6feed7aab0c3668f9cd13wrowe */
3f5b4558f5410fdac5d6feed7aab0c3668f9cd13wrowe if ((dirent.valid & APR_FINFO_TYPE) && (dirent.filetype == APR_DIR))
3f5b4558f5410fdac5d6feed7aab0c3668f9cd13wrowe continue;
948096a99010fccf648814fecf38f75c689172d7wrowe
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe /* Ok, something's here. Maybe nothing useful. Remember that
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe * we tried, if we completely fail, so we can reject the request!
053497224246c4dbef9af594cacf5c00ed271e6cwrowe */
053497224246c4dbef9af594cacf5c00ed271e6cwrowe anymatch = 1;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb /* See if it's something which we have access to, and which
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * has a known type and encoding.
948096a99010fccf648814fecf38f75c689172d7wrowe */
948096a99010fccf648814fecf38f75c689172d7wrowe sub_req = ap_sub_req_lookup_dirent(&dirent, r, AP_SUBREQ_MERGE_ARGS,
948096a99010fccf648814fecf38f75c689172d7wrowe NULL);
948096a99010fccf648814fecf38f75c689172d7wrowe
948096a99010fccf648814fecf38f75c689172d7wrowe /* Double check, we still don't multi-resolve non-ordinary files
948096a99010fccf648814fecf38f75c689172d7wrowe */
948096a99010fccf648814fecf38f75c689172d7wrowe if (sub_req->finfo.filetype != APR_REG) {
948096a99010fccf648814fecf38f75c689172d7wrowe /* XXX sub req not destroyed -- may be a bug/unintentional ? */
948096a99010fccf648814fecf38f75c689172d7wrowe continue;
948096a99010fccf648814fecf38f75c689172d7wrowe }
948096a99010fccf648814fecf38f75c689172d7wrowe
948096a99010fccf648814fecf38f75c689172d7wrowe /* If it has a handler, we'll pretend it's a CGI script,
948096a99010fccf648814fecf38f75c689172d7wrowe * since that's a good indication of the sort of thing it
053497224246c4dbef9af594cacf5c00ed271e6cwrowe * might be doing.
948096a99010fccf648814fecf38f75c689172d7wrowe */
948096a99010fccf648814fecf38f75c689172d7wrowe if (sub_req->handler && !sub_req->content_type) {
948096a99010fccf648814fecf38f75c689172d7wrowe ap_set_content_type(sub_req, CGI_MAGIC_TYPE);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
948096a99010fccf648814fecf38f75c689172d7wrowe
948096a99010fccf648814fecf38f75c689172d7wrowe /*
948096a99010fccf648814fecf38f75c689172d7wrowe * mod_mime will _always_ provide us the base name in the
948096a99010fccf648814fecf38f75c689172d7wrowe * ap-mime-exception-list, if it processed anything. If
948096a99010fccf648814fecf38f75c689172d7wrowe * this list is empty, give up immediately, there was
948096a99010fccf648814fecf38f75c689172d7wrowe * nothing interesting. For example, looking at the files
053497224246c4dbef9af594cacf5c00ed271e6cwrowe * readme.txt and readme.foo, we will throw away .foo if
948096a99010fccf648814fecf38f75c689172d7wrowe * it's an insignificant file (e.g. did not identify a
948096a99010fccf648814fecf38f75c689172d7wrowe * language, charset, encoding, content type or handler,)
948096a99010fccf648814fecf38f75c689172d7wrowe */
948096a99010fccf648814fecf38f75c689172d7wrowe exception_list =
948096a99010fccf648814fecf38f75c689172d7wrowe (apr_array_header_t *)apr_table_get(sub_req->notes,
948096a99010fccf648814fecf38f75c689172d7wrowe "ap-mime-exceptions-list");
948096a99010fccf648814fecf38f75c689172d7wrowe
948096a99010fccf648814fecf38f75c689172d7wrowe if (!exception_list) {
948096a99010fccf648814fecf38f75c689172d7wrowe ap_destroy_sub_req(sub_req);
948096a99010fccf648814fecf38f75c689172d7wrowe continue;
948096a99010fccf648814fecf38f75c689172d7wrowe }
948096a99010fccf648814fecf38f75c689172d7wrowe
948096a99010fccf648814fecf38f75c689172d7wrowe /* Each unregonized bit better match our base name, in sequence.
948096a99010fccf648814fecf38f75c689172d7wrowe * A test of index.html.foo will match index.foo or index.html.foo,
948096a99010fccf648814fecf38f75c689172d7wrowe * but it will never transpose the segments and allow index.foo.html
948096a99010fccf648814fecf38f75c689172d7wrowe * because that would introduce too much CPU consumption. Better that
948096a99010fccf648814fecf38f75c689172d7wrowe * we don't attempt a many-to-many match here.
948096a99010fccf648814fecf38f75c689172d7wrowe */
053497224246c4dbef9af594cacf5c00ed271e6cwrowe {
053497224246c4dbef9af594cacf5c00ed271e6cwrowe int nexcept = exception_list->nelts;
053497224246c4dbef9af594cacf5c00ed271e6cwrowe char **cur_except = (char**)exception_list->elts;
948096a99010fccf648814fecf38f75c689172d7wrowe char *segstart = filp, *segend, saveend;
053497224246c4dbef9af594cacf5c00ed271e6cwrowe
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb while (*segstart && nexcept) {
053497224246c4dbef9af594cacf5c00ed271e6cwrowe if (!(segend = strchr(segstart, '.')))
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb segend = strchr(segstart, '\0');
053497224246c4dbef9af594cacf5c00ed271e6cwrowe saveend = *segend;
053497224246c4dbef9af594cacf5c00ed271e6cwrowe *segend = '\0';
053497224246c4dbef9af594cacf5c00ed271e6cwrowe
053497224246c4dbef9af594cacf5c00ed271e6cwrowe#ifdef CASE_BLIND_FILESYSTEM
053497224246c4dbef9af594cacf5c00ed271e6cwrowe if (strcasecmp(segstart, *cur_except) == 0) {
053497224246c4dbef9af594cacf5c00ed271e6cwrowe#else
053497224246c4dbef9af594cacf5c00ed271e6cwrowe if (strcmp(segstart, *cur_except) == 0) {
053497224246c4dbef9af594cacf5c00ed271e6cwrowe#endif
948096a99010fccf648814fecf38f75c689172d7wrowe --nexcept;
948096a99010fccf648814fecf38f75c689172d7wrowe ++cur_except;
053497224246c4dbef9af594cacf5c00ed271e6cwrowe }
948096a99010fccf648814fecf38f75c689172d7wrowe
948096a99010fccf648814fecf38f75c689172d7wrowe if (!saveend)
053497224246c4dbef9af594cacf5c00ed271e6cwrowe break;
053497224246c4dbef9af594cacf5c00ed271e6cwrowe
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb *segend = saveend;
948096a99010fccf648814fecf38f75c689172d7wrowe segstart = segend + 1;
948096a99010fccf648814fecf38f75c689172d7wrowe }
948096a99010fccf648814fecf38f75c689172d7wrowe
948096a99010fccf648814fecf38f75c689172d7wrowe if (nexcept) {
948096a99010fccf648814fecf38f75c689172d7wrowe /* Something you don't know is, something you don't know...
948096a99010fccf648814fecf38f75c689172d7wrowe */
948096a99010fccf648814fecf38f75c689172d7wrowe ap_destroy_sub_req(sub_req);
948096a99010fccf648814fecf38f75c689172d7wrowe continue;
948096a99010fccf648814fecf38f75c689172d7wrowe }
948096a99010fccf648814fecf38f75c689172d7wrowe }
948096a99010fccf648814fecf38f75c689172d7wrowe
948096a99010fccf648814fecf38f75c689172d7wrowe /*
948096a99010fccf648814fecf38f75c689172d7wrowe * If we failed the subrequest, or don't
948096a99010fccf648814fecf38f75c689172d7wrowe * know what we are serving, then continue.
948096a99010fccf648814fecf38f75c689172d7wrowe */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (sub_req->status != HTTP_OK || (!sub_req->content_type)) {
948096a99010fccf648814fecf38f75c689172d7wrowe ap_destroy_sub_req(sub_req);
948096a99010fccf648814fecf38f75c689172d7wrowe continue;
948096a99010fccf648814fecf38f75c689172d7wrowe }
948096a99010fccf648814fecf38f75c689172d7wrowe
948096a99010fccf648814fecf38f75c689172d7wrowe /* If it's a map file, we use that instead of the map
948096a99010fccf648814fecf38f75c689172d7wrowe * we're building...
696218c49632c863d18b25fa52ab63617088cb38wrowe */
948096a99010fccf648814fecf38f75c689172d7wrowe if (((sub_req->content_type) &&
948096a99010fccf648814fecf38f75c689172d7wrowe !strcmp(sub_req->content_type, MAP_FILE_MAGIC_TYPE)) ||
948096a99010fccf648814fecf38f75c689172d7wrowe ((sub_req->handler) &&
948096a99010fccf648814fecf38f75c689172d7wrowe !strcmp(sub_req->handler, "type-map"))) {
948096a99010fccf648814fecf38f75c689172d7wrowe
948096a99010fccf648814fecf38f75c689172d7wrowe apr_dir_close(dirp);
053497224246c4dbef9af594cacf5c00ed271e6cwrowe neg->avail_vars->nelts = 0;
948096a99010fccf648814fecf38f75c689172d7wrowe if (sub_req->status != HTTP_OK) {
948096a99010fccf648814fecf38f75c689172d7wrowe return sub_req->status;
053497224246c4dbef9af594cacf5c00ed271e6cwrowe }
053497224246c4dbef9af594cacf5c00ed271e6cwrowe return read_type_map(NULL, neg, sub_req);
948096a99010fccf648814fecf38f75c689172d7wrowe }
948096a99010fccf648814fecf38f75c689172d7wrowe
053497224246c4dbef9af594cacf5c00ed271e6cwrowe /* Have reasonable variant --- gather notes. */
948096a99010fccf648814fecf38f75c689172d7wrowe
053497224246c4dbef9af594cacf5c00ed271e6cwrowe mime_info.sub_req = sub_req;
053497224246c4dbef9af594cacf5c00ed271e6cwrowe mime_info.file_name = apr_pstrdup(neg->pool, dirent.name);
948096a99010fccf648814fecf38f75c689172d7wrowe if (sub_req->content_encoding) {
948096a99010fccf648814fecf38f75c689172d7wrowe mime_info.content_encoding = sub_req->content_encoding;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (sub_req->content_languages) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb mime_info.content_languages = sub_req->content_languages;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb get_entry(neg->pool, &accept_info, sub_req->content_type);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb set_mime_fields(&mime_info, &accept_info);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb new_var = apr_array_push(neg->avail_vars);
2fa5b5878e7567e2875807c3e2a2b3b0d3ef74bewrowe memcpy(new_var, (void *) &mime_info, sizeof(var_rec));
2fa5b5878e7567e2875807c3e2a2b3b0d3ef74bewrowe
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb neg->count_multiviews_variants++;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe clean_var_rec(&mime_info);
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe }
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe apr_dir_close(dirp);
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe /* We found some file names that matched. None could be served.
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe * Rather than fall out to autoindex or some other mapper, this
dc8692c6c0ca616a09aa12dad005f2ef23baa1a0wrowe * request must die.
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (anymatch && !neg->avail_vars->nelts) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb ap_log_rerror(APLOG_MARK, APLOG_ERR, 0, r, APLOGNO(00687)
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb "Negotiation: discovered file(s) matching request: %s"
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb " (None could be negotiated).",
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb r->filename);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb return HTTP_NOT_FOUND;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb set_vlist_validator(r, r);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb /* Sort the variants into a canonical order. The negotiation
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * result sometimes depends on the order of the variants. By
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * sorting the variants into a canonical order, rather than using
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * the order in which readdir() happens to return them, we ensure
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * that the negotiation result will be consistent over filesystem
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * backup/restores and over all mirror sites.
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb qsort((void *) neg->avail_vars->elts, neg->avail_vars->nelts,
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb sizeof(var_rec), (int (*)(const void *, const void *)) variantsortf);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb return OK;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb}
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb/*****************************************************************
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * And now for the code you've been waiting for... actually
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * finding a match to the client's requirements.
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb/* Matching MIME types ... the star/star and foo/star commenting conventions
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * are implemented here. (You know what I mean by star/star, but just
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * try mentioning those three characters in a C comment). Using strcmp()
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * is legit, because everything has already been smashed to lowercase.
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb *
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * Note also that if we get an exact match on the media type, we update
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * level_matched for use in level_cmp below...
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb *
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * We also give a value for mime_stars, which is used later. It should
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * be 1 for star/star, 2 for type/star and 3 for type/subtype.
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
/* Decide whether one media range from the Accept: header covers a variant.
 *
 * accept_r - the parsed Accept: element; its name and level are read.
 * avail    - the variant under test; mime_stars (and, for an exact
 *            match, level_matched) are updated in place on a match.
 *
 * Returns 1 on a match and 0 otherwise.  On a match, mime_stars records
 * how specific the range was: 1 for a full wildcard ("*" or star/star),
 * 2 for type/star and 3 for an exact type/subtype.  Wildcard matches only
 * ever raise mime_stars, so a more specific earlier match is not lost.
 *
 * Only well-formed wildcards are honoured.  The range must be exactly "*"
 * or star/star to match everything, and a partial wildcard must end in a
 * slash followed by a star and agree with the variant's type up to and
 * including that slash.  An empty or oddly shaped range falls through to
 * the exact comparison; it is never indexed before its first character
 * and never matches on a bare prefix.
 */
static int mime_match(accept_rec *accept_r, var_rec *avail)
{
    const char *accept_type = accept_r->name;
    const char *avail_type = avail->mime_type;
    size_t len = strlen(accept_type);

    if ((len == 1 && accept_type[0] == '*')
        || (len == 3 && strcmp(accept_type, "*/*") == 0)) {
        /* Anything matches star or star/star */
        if (avail->mime_stars < 1) {
            avail->mime_stars = 1;
        }
        return 1;
    }
    else if (len > 2
             && accept_type[len - 2] == '/'
             && accept_type[len - 1] == '*'
             && strncmp(accept_type, avail_type, len - 2) == 0
             && avail_type[len - 2] == '/') {
        /* Any subtype matches type/star.  The strncmp() above succeeding
         * guarantees avail_type has at least len - 2 characters, so the
         * read of avail_type[len - 2] stays inside the string.
         */
        if (avail->mime_stars < 2) {
            avail->mime_stars = 2;
        }
        return 1;
    }
    else if (strcmp(accept_type, avail_type) == 0
             || (strcmp(accept_type, "text/html") == 0
                 && (strcmp(avail_type, INCLUDES_MAGIC_TYPE) == 0
                     || strcmp(avail_type, INCLUDES_MAGIC_TYPE3) == 0))) {
        /* Exact type (the server-parsed magic types count as text/html).
         * It only counts when the client accepts at least the variant's
         * level.
         */
        if (accept_r->level >= avail->level) {
            avail->level_matched = avail->level;
            avail->mime_stars = 3;
            return 1;
        }
    }

    /* No match.  This is a boolean result, not a handler status code. */
    return 0;
}
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb/* This code implements a piece of the tie-breaking algorithm between
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * variants of equal quality. This piece is the treatment of variants
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * of the same base media type, but different levels. What we want to
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * return is the variant at the highest level that the client explicitly
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * claimed to accept.
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb *
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * If all the variants available are at a higher level than that, or if
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * the client didn't say anything specific about this media type at all
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * and these variants just got in on a wildcard, we prefer the lowest
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * level, on grounds that that's the one that the client is least likely
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * to choke on.
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe *
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe * (This is all motivated by treatment of levels in HTML --- we only
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe * want to give level 3 to browsers that explicitly ask for it; browsers
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe * that don't, including HTTP/0.9 browsers that only get the implicit
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe * "Accept: * / *" [space added to avoid confusing cpp --- no, that
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe * syntax doesn't really work] should get HTML2 if available).
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe *
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe * (Note that this code only comes into play when we are choosing among
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe * variants of equal quality, where the draft standard gives us a fair
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe * bit of leeway about what to do. It ain't specified by the standard;
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe * rather, it is a choice made by this server about what to do in cases
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe * where the standard does not specify a unique course of action).
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe */
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowestatic int level_cmp(var_rec *var1, var_rec *var2)
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe{
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe /* Levels are only comparable between matching media types */
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe if (var1->is_pseudo_html && !var2->is_pseudo_html) {
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe return 0;
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe }
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe if (!var1->is_pseudo_html && strcmp(var1->mime_type, var2->mime_type)) {
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe return 0;
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe }
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe /* The result of the above if statements is that, if we get to
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe * here, both variants have the same mime_type or both are
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe * pseudo-html.
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe */
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb /* Take highest level that matched, if either did match. */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (var1->level_matched > var2->level_matched) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb return 1;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (var1->level_matched < var2->level_matched) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb return -1;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
4ca6cbe768b4e0917ac0b76333c26a7d5396d454trawick
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb /* Neither matched. Take lowest level, if there's a difference. */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (var1->level < var2->level) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb return 1;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (var1->level > var2->level) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb return -1;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb /* Tied */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb return 0;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb}
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
/* Finding languages.  The main entry point is set_language_quality(),
 * which is called for each variant.  It sets two elements in the
 * variant record:
 *    lang_quality  - the 'q' value of the 'best' matching language
 *                    from the Accept-Language: header (HTTP/1.1)
 *    lang_index    - Non-negotiated language priority, using
 *                    position of language on the Accept-Language:
 *                    header, if present, else LanguagePriority
 *                    directive order.
 *
 * When we do the variant checking for best variant, we use language
 * quality first and, if that ties, lang_index next (this only applies
 * when _not_ using the RVSA/1.0 algorithm).  If using the RVSA/1.0
 * algorithm, lang_index is never used.
 *
 * set_language_quality() calls find_lang_index() to set lang_index.
 */
b67fb549910fa0faf4cdd8aeaf9aeab51d4b6a92wrowe
/* Return the position of the first entry in accept_langs whose name is a
 * leading substring of lang, or -1 when no entry qualifies or either
 * argument is NULL.
 *
 * Each element is read as a pointer to the entry's name.  The walk
 * advances by the array's element size expressed in pointer-sized units,
 * so elements may be larger than a single pointer.
 */
static int find_lang_index(apr_array_header_t *accept_langs, char *lang)
{
    const char **entry;
    size_t stride;
    int pos;

    if (accept_langs == NULL || lang == NULL) {
        return -1;
    }

    /* Number of char* slots occupied by one array element. */
    stride = accept_langs->elt_size / sizeof(char *);

    for (pos = 0, entry = (const char **) accept_langs->elts;
         pos < accept_langs->nelts;
         ++pos, entry += stride) {
        /* Compare only as many characters as the entry has. */
        if (strncmp(lang, *entry, strlen(*entry)) == 0) {
            return pos;
        }
    }

    return -1;
}
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb/* set_default_lang_quality() sets the quality we apply to variants
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * which have no language assigned to them. If none of the variants
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * have a language, we are not negotiating on language, so all are
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * acceptable, and we set the default q value to 1.0. However if
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * some of the variants have languages, we set this default to 0.0001.
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * The value of this default will be applied to all variants with
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * no explicit language -- which will have the effect of making them
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * acceptable, but only if no variants with an explicit language
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * are acceptable. The default q value set here is assigned to variants
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * with no language type in set_language_quality().
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb *
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * Note that if using the RVSA/1.0 algorithm, we don't use this
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * fiddle.
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
efa1a34b0a7785fc72863eff175b0cfc1ecb0e38wrowestatic void set_default_lang_quality(negotiation_state *neg)
117026201e6d8fe7d82416b8a7324830f5a87292wrowe{
117026201e6d8fe7d82416b8a7324830f5a87292wrowe var_rec *avail_recs = (var_rec *) neg->avail_vars->elts;
117026201e6d8fe7d82416b8a7324830f5a87292wrowe int j;
117026201e6d8fe7d82416b8a7324830f5a87292wrowe
117026201e6d8fe7d82416b8a7324830f5a87292wrowe if (!neg->dont_fiddle_headers) {
117026201e6d8fe7d82416b8a7324830f5a87292wrowe for (j = 0; j < neg->avail_vars->nelts; ++j) {
117026201e6d8fe7d82416b8a7324830f5a87292wrowe var_rec *variant = &avail_recs[j];
117026201e6d8fe7d82416b8a7324830f5a87292wrowe if (variant->content_languages &&
117026201e6d8fe7d82416b8a7324830f5a87292wrowe variant->content_languages->nelts) {
117026201e6d8fe7d82416b8a7324830f5a87292wrowe neg->default_lang_quality = 0.0001f;
117026201e6d8fe7d82416b8a7324830f5a87292wrowe return;
117026201e6d8fe7d82416b8a7324830f5a87292wrowe }
117026201e6d8fe7d82416b8a7324830f5a87292wrowe }
1ab995011876f631740d68d960a6d729ddff5bfawrowe }
117026201e6d8fe7d82416b8a7324830f5a87292wrowe
117026201e6d8fe7d82416b8a7324830f5a87292wrowe neg->default_lang_quality = 1.0f;
117026201e6d8fe7d82416b8a7324830f5a87292wrowe}
117026201e6d8fe7d82416b8a7324830f5a87292wrowe
55eb5bb774cfb861542b827fbf4c30e6efbbfc44wrowe/* Set the language_quality value in the variant record. Also
117026201e6d8fe7d82416b8a7324830f5a87292wrowe * assigns lang_index for ForceLanguagePriority.
117026201e6d8fe7d82416b8a7324830f5a87292wrowe *
117026201e6d8fe7d82416b8a7324830f5a87292wrowe * To find the language_quality value, we look for the 'q' value
117026201e6d8fe7d82416b8a7324830f5a87292wrowe * of the 'best' matching language on the Accept-Language
117026201e6d8fe7d82416b8a7324830f5a87292wrowe * header. The 'best' match is the language on Accept-Language
117026201e6d8fe7d82416b8a7324830f5a87292wrowe * header which matches the language of this variant either fully,
117026201e6d8fe7d82416b8a7324830f5a87292wrowe * or as far as the prefix marker (-). If two or more languages
117026201e6d8fe7d82416b8a7324830f5a87292wrowe * match, use the longest string from the Accept-Language header
117026201e6d8fe7d82416b8a7324830f5a87292wrowe * (see HTTP/1.1 [14.4])
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe *
117026201e6d8fe7d82416b8a7324830f5a87292wrowe * When a variant has multiple languages, we find the 'best'
117026201e6d8fe7d82416b8a7324830f5a87292wrowe * match for each variant language tag as above, then select the
e7505ba54ac56ae30e4e250f912f3dbaf92ca45fwrowe * one with the highest q value. Because both the accept-header
e7505ba54ac56ae30e4e250f912f3dbaf92ca45fwrowe * and variant can have multiple languages, we now have a hairy
e7505ba54ac56ae30e4e250f912f3dbaf92ca45fwrowe * loop-within-a-loop here.
117026201e6d8fe7d82416b8a7324830f5a87292wrowe *
117026201e6d8fe7d82416b8a7324830f5a87292wrowe * If the variant has no language and we have no Accept-Language
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * items, leave the quality at 1.0 and return.
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe *
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * If the variant has no language, we use the default as set by
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * set_default_lang_quality() (1.0 if we are not negotiating on
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * language, 0.001 if we are).
efa1a34b0a7785fc72863eff175b0cfc1ecb0e38wrowe *
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * Following the setting of the language quality, we drop through to
beda1fb2f11c52ca4612460a5d5ba47398143efbwrowe * set the old 'lang_index'. This is set based on either the order
beda1fb2f11c52ca4612460a5d5ba47398143efbwrowe * of the languages on the Accept-Language header, or the
beda1fb2f11c52ca4612460a5d5ba47398143efbwrowe * order on the LanguagePriority directive. This is only used
beda1fb2f11c52ca4612460a5d5ba47398143efbwrowe * in the negotiation if the language qualities tie.
beda1fb2f11c52ca4612460a5d5ba47398143efbwrowe */
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowestatic void set_language_quality(negotiation_state *neg, var_rec *variant)
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe{
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe int forcepriority = neg->conf->forcelangpriority;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe if (forcepriority == FLP_UNDEF) {
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe forcepriority = FLP_DEFAULT;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe }
117026201e6d8fe7d82416b8a7324830f5a87292wrowe
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe if (!variant->content_languages || !variant->content_languages->nelts) {
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe /* This variant has no content-language, so use the default
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * quality factor for variants with no content-language
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * (previously set by set_default_lang_quality()).
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * Leave the factor alone (it remains at 1.0) when we may not fiddle
117026201e6d8fe7d82416b8a7324830f5a87292wrowe * with the headers.
117026201e6d8fe7d82416b8a7324830f5a87292wrowe */
efa1a34b0a7785fc72863eff175b0cfc1ecb0e38wrowe if (!neg->dont_fiddle_headers) {
117026201e6d8fe7d82416b8a7324830f5a87292wrowe variant->lang_quality = neg->default_lang_quality;
117026201e6d8fe7d82416b8a7324830f5a87292wrowe }
117026201e6d8fe7d82416b8a7324830f5a87292wrowe if (!neg->accept_langs) {
117026201e6d8fe7d82416b8a7324830f5a87292wrowe return; /* no accept-language header */
117026201e6d8fe7d82416b8a7324830f5a87292wrowe }
117026201e6d8fe7d82416b8a7324830f5a87292wrowe return;
117026201e6d8fe7d82416b8a7324830f5a87292wrowe }
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe else {
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe /* Variant has one (or more) languages. Look for the best
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * match. We do this by going through each language on the
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * variant description looking for a match on the
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * Accept-Language header. The best match is the longest
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * matching language on the header. The final result is the
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * best q value from all the languages on the variant
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * description.
117026201e6d8fe7d82416b8a7324830f5a87292wrowe */
117026201e6d8fe7d82416b8a7324830f5a87292wrowe
117026201e6d8fe7d82416b8a7324830f5a87292wrowe if (!neg->accept_langs) {
117026201e6d8fe7d82416b8a7324830f5a87292wrowe /* no accept-language header makes the variant indefinite */
117026201e6d8fe7d82416b8a7324830f5a87292wrowe variant->definite = 0;
117026201e6d8fe7d82416b8a7324830f5a87292wrowe }
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe else { /* There is an accept-language with 0 or more items */
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe accept_rec *accs = (accept_rec *) neg->accept_langs->elts;
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe accept_rec *best = NULL, *star = NULL;
117026201e6d8fe7d82416b8a7324830f5a87292wrowe accept_rec *bestthistag;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe char *lang, *p;
117026201e6d8fe7d82416b8a7324830f5a87292wrowe float fiddle_q = 0.0f;
117026201e6d8fe7d82416b8a7324830f5a87292wrowe int any_match_on_star = 0;
117026201e6d8fe7d82416b8a7324830f5a87292wrowe int i, j;
117026201e6d8fe7d82416b8a7324830f5a87292wrowe apr_size_t alen, longest_lang_range_len;
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe for (j = 0; j < variant->content_languages->nelts; ++j) {
73fbb0a2e9cb209173d6c319c57260cbf29c8cc7wrowe p = NULL;
73fbb0a2e9cb209173d6c319c57260cbf29c8cc7wrowe bestthistag = NULL;
73fbb0a2e9cb209173d6c319c57260cbf29c8cc7wrowe longest_lang_range_len = 0;
73fbb0a2e9cb209173d6c319c57260cbf29c8cc7wrowe
650ac07cba9ab3ad9bdeda50b78c278442604814wrowe /* lang is the variant's language-tag, which is the one
650ac07cba9ab3ad9bdeda50b78c278442604814wrowe * we are allowed to use the prefix of in HTTP/1.1
650ac07cba9ab3ad9bdeda50b78c278442604814wrowe */
650ac07cba9ab3ad9bdeda50b78c278442604814wrowe lang = ((char **) (variant->content_languages->elts))[j];
117026201e6d8fe7d82416b8a7324830f5a87292wrowe
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe /* now find the best (i.e. longest) matching
1067418d9ed9ed9daeb3ca4f74e72db810c49833wrowe * Accept-Language header language. We put the best match
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * for this tag in bestthistag. We cannot update the
1067418d9ed9ed9daeb3ca4f74e72db810c49833wrowe * overall best (based on q value) because the best match
1067418d9ed9ed9daeb3ca4f74e72db810c49833wrowe * for this tag is the longest language item on the accept
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * header, not necessarily the highest q.
1067418d9ed9ed9daeb3ca4f74e72db810c49833wrowe */
117026201e6d8fe7d82416b8a7324830f5a87292wrowe for (i = 0; i < neg->accept_langs->nelts; ++i) {
117026201e6d8fe7d82416b8a7324830f5a87292wrowe if (!strcmp(accs[i].name, "*")) {
b67fb549910fa0faf4cdd8aeaf9aeab51d4b6a92wrowe if (!star) {
b67fb549910fa0faf4cdd8aeaf9aeab51d4b6a92wrowe star = &accs[i];
b67fb549910fa0faf4cdd8aeaf9aeab51d4b6a92wrowe }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb continue;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb /* Find language. We match if either the variant
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * language tag exactly matches the language range
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe * from the accept header, or a prefix of the variant
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * language tag up to a '-' character matches the
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * whole of the language range in the Accept-Language
1b839c67d5c0e4b1f22b44a4217f9860b420d47cwrowe * header. Note that HTTP/1.x allows any number of
b45c1c292ff1fa635004ae81fa691f8cb3cdda85rbb * '-' characters in a tag or range, currently only
1ab995011876f631740d68d960a6d729ddff5bfawrowe * tags with zero or one '-' characters are defined
1ab995011876f631740d68d960a6d729ddff5bfawrowe * for general use (see rfc1766).
1ab995011876f631740d68d960a6d729ddff5bfawrowe *
1ab995011876f631740d68d960a6d729ddff5bfawrowe * We only use language range in the Accept-Language
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe * header the best match for the variant language tag
e68544ae924174ca227ede8e2e722cefa00ea0d3wrowe * if it is longer than the previous best match.
1ab995011876f631740d68d960a6d729ddff5bfawrowe */
b67fb549910fa0faf4cdd8aeaf9aeab51d4b6a92wrowe
b67fb549910fa0faf4cdd8aeaf9aeab51d4b6a92wrowe alen = strlen(accs[i].name);
b67fb549910fa0faf4cdd8aeaf9aeab51d4b6a92wrowe
b45c1c292ff1fa635004ae81fa691f8cb3cdda85rbb if ((strlen(lang) >= alen) &&
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb !strncmp(lang, accs[i].name, alen) &&
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe ((lang[alen] == 0) || (lang[alen] == '-')) ) {
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe
ecc4a080f07af3fbc1b91bbd00997ec1d592c6f9wrowe if (alen > longest_lang_range_len) {
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe longest_lang_range_len = alen;
2d2dadb81bf34e3bc9321eabcd971a738431b364wrowe bestthistag = &accs[i];
2d2dadb81bf34e3bc9321eabcd971a738431b364wrowe }
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe }
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe if (!bestthistag && !neg->dont_fiddle_headers) {
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe /* The next bit is a fiddle. Some browsers might
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe * be configured to send more specific language
2d2dadb81bf34e3bc9321eabcd971a738431b364wrowe * ranges than desirable. For example, an
ecc4a080f07af3fbc1b91bbd00997ec1d592c6f9wrowe * Accept-Language of en-US should never match
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * variants with languages en or en-GB. But US
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * English speakers might pick en-US as their
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * language choice. So this fiddle checks if the
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe * language range has a prefix, and if so, it
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe * matches variants which match that prefix with a
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe * priority of 0.001. So a request for en-US would
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe * match variants of types en and en-GB, but at
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe * much lower priority than matches of en-US
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * directly, or of any other language listed on
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * the Accept-Language header. Note that this
af7e32b660b02a378e91d40987e59b28864db954jwoolley * fiddle does not handle multi-level prefixes.
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe */
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe if ((p = strchr(accs[i].name, '-'))) {
5bb29f57ae0184d2b3c1cdf35132f8ceb011f882wrowe int plen = p - accs[i].name;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (!strncmp(lang, accs[i].name, plen)) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb fiddle_q = 0.001f;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe }
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe }
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe /* Finished looking at Accept-Language headers, the best
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * (longest) match is in bestthistag, or NULL if no match
e16c4a220d3410c6f3424e7f6b12f3cd5455dddejwoolley */
e16c4a220d3410c6f3424e7f6b12f3cd5455dddejwoolley if (!best ||
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe (bestthistag && bestthistag->quality > best->quality)) {
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe best = bestthistag;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe }
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe /* See if the tag matches on a * in the Accept-Language
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * header. If so, record this fact for later use
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe */
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe if (!bestthistag && star) {
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe any_match_on_star = 1;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe /* If one of the language tags of the variant matched on *, we
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * need to see if its q is better than that of any non-* match
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * on any other tag of the variant. If so the * match takes
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * precedence and the overall match is not definite.
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe if ( any_match_on_star &&
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb ((best && star->quality > best->quality) ||
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb (!best)) ) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb best = star;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb variant->definite = 0;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe variant->lang_quality = best ? best->quality : fiddle_q;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe }
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe }
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe /* Handle the ForceDefaultLanguage overrides, based on the best match
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * to LanguagePriority order. The best match is the lowest index of
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe * any LanguagePriority match.
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe */
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe if (((forcepriority & FLP_PREFER)
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb && (variant->lang_index < 0))
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb || ((forcepriority & FLP_FALLBACK)
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb && !variant->lang_quality))
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb int bestidx = -1;
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe int j;
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe for (j = 0; j < variant->content_languages->nelts; ++j)
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb {
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe /* lang is the variant's language-tag, which is the one
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * we are allowed to use the prefix of in HTTP/1.1
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb char *lang = ((char **) (variant->content_languages->elts))[j];
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb int idx = -1;
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe /* If we wish to fallback or
73fbb0a2e9cb209173d6c319c57260cbf29c8cc7wrowe * we use our own LanguagePriority index.
73fbb0a2e9cb209173d6c319c57260cbf29c8cc7wrowe */
73fbb0a2e9cb209173d6c319c57260cbf29c8cc7wrowe idx = find_lang_index(neg->conf->language_priority, lang);
650ac07cba9ab3ad9bdeda50b78c278442604814wrowe if ((idx >= 0) && ((bestidx == -1) || (idx < bestidx))) {
73fbb0a2e9cb209173d6c319c57260cbf29c8cc7wrowe bestidx = idx;
73fbb0a2e9cb209173d6c319c57260cbf29c8cc7wrowe }
73fbb0a2e9cb209173d6c319c57260cbf29c8cc7wrowe }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if (bestidx >= 0) {
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe if (variant->lang_quality) {
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe if (forcepriority & FLP_PREFER) {
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe variant->lang_index = bestidx;
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe }
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe }
290ecc1ddceca1ed49bc1a5338921264b5c3e07cwrowe else {
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe if (forcepriority & FLP_FALLBACK) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb variant->lang_index = bestidx;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb variant->lang_quality = .0001f;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb variant->definite = 0;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb return;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb}
58097d7d8d1a394092374b9f6ddf76b7993724a4rbb
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe/* Determining the content length --- if the map didn't tell us,
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe * we have to do a stat() and remember for next time.
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe */
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowestatic apr_off_t find_content_length(negotiation_state *neg, var_rec *variant)
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb{
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe apr_finfo_t statb;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
a2a0abd88b19e042a3eb2a9fa1702c25ad51303dwrowe if (variant->bytes < 0) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb if ( variant->sub_req
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe && (variant->sub_req->finfo.valid & APR_FINFO_SIZE)) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb variant->bytes = variant->sub_req->finfo.size;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe else {
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe char *fullname = ap_make_full_path(neg->pool, neg->dir_name,
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb variant->file_name);
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
83a8dc5a596a8a1b9d14f063268287d123b9ed7ewrowe if (apr_stat(&statb, fullname,
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb APR_FINFO_SIZE, neg->pool) == APR_SUCCESS) {
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb variant->bytes = statb.size;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb }
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb return variant->bytes;
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb}
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb/* For a given variant, find the best matching Accept: header
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * and assign the Accept: header's quality value to the
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * mime_type_quality field of the variant, for later use in
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb * determining the best matching variant.
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb */
b38846b15c8891c6dec44dcc4f96ca40721bf663rbb
static void set_accept_quality(negotiation_state *neg, var_rec *variant)
{
    /* Derives variant->mime_type_quality from the media ranges stored in
     * neg->accepts and folds the result into variant->definite.
     */
    int i;
    accept_rec *accept_recs;
    float q = 0.0f;
    int q_definite = 1;
    int lower_wildcards;

    /* if no Accept: header, leave quality alone (will
     * remain at the default value of 1)
     *
     * XXX: This if is currently never true because of the effect of
     * maybe_add_default_accepts().
     */
    if (!neg->accepts) {
        if (variant->mime_type && *variant->mime_type) {
            variant->definite = 0;
        }
        return;
    }

    accept_recs = (accept_rec *) neg->accepts->elts;

    /* We only mess with the q-values of wildcard ranges when we are
     * allowed to fiddle with headers and the Accept header carried no
     * explicit q= parameter.  Neither flag changes inside the loop.
     */
    lower_wildcards = !neg->dont_fiddle_headers && !neg->accept_q;

    /*
     * Go through each of the ranges on the Accept: header,
     * looking for the 'best' match with this variant's
     * content-type.  We use the best match's quality
     * value (from the Accept: header) for this variant's
     * mime_type_quality field.
     *
     * The best match is determined like this:
     *    type/type is better than type/ * is better than * / *
     *    if match is type/type, use the level mime param if available
     */
    for (i = 0; i < neg->accepts->nelts; ++i) {
        accept_rec *type = &accept_recs[i];
        int prev_mime_stars = variant->mime_stars;

        if (!mime_match(type, variant)) {
            continue;           /* didn't match the content type at all */
        }

        /* It matched, but variant->mime_stars is unchanged, so this range
         * is skipped.  Presumably mime_match() only updates mime_stars
         * for a more specific match than any seen before - confirm
         * against mime_match().
         */
        if (prev_mime_stars == variant->mime_stars) {
            continue;
        }

        /* Make wildcards very low, so we have a low chance of ending up
         * with them if there's something better.
         */
        if (lower_wildcards && variant->mime_stars == 1) {
            q = 0.01f;
        }
        else if (lower_wildcards && variant->mime_stars == 2) {
            q = 0.02f;
        }
        else {
            q = type->quality;
        }

        q_definite = (variant->mime_stars == 3);
    }

    variant->mime_type_quality = q;
    variant->definite = variant->definite && q_definite;
}
/* For a given variant, find the 'q' value of the charset given
 * on the Accept-Charset line.  If no charsets are listed,
 * assume value of '1'.
 *
 * The result is stored in variant->charset_quality; variant->definite is
 * cleared when the quality could only be determined by a "*" entry, or
 * when there is no Accept-Charset header but the variant has a charset.
 */
static void set_charset_quality(negotiation_state *neg, var_rec *variant)
{
    int i;
    accept_rec *accept_recs;
    const char *charset = variant->content_charset;
    accept_rec *star = NULL;

    /* if no Accept-Charset: header, leave quality alone (will
     * remain at the default value of 1)
     */
    if (!neg->accept_charsets) {
        if (charset && *charset) {
            variant->definite = 0;
        }
        return;
    }

    accept_recs = (accept_rec *) neg->accept_charsets->elts;

    if (charset == NULL || !*charset) {
        /* Charset of variant not known */
        const char *mime_type = variant->mime_type;

        /* if not a text / * type, leave quality alone.  A variant
         * without any media type cannot be a text type either; checking
         * for NULL here keeps us from handing a NULL pointer to the
         * string comparison functions.
         */
        if (mime_type == NULL
            || !(!strncmp(mime_type, "text/", 5)
                 || !strcmp(mime_type, INCLUDES_MAGIC_TYPE)
                 || !strcmp(mime_type, INCLUDES_MAGIC_TYPE3))) {
            return;
        }

        /* Don't go guessing if we are in strict header mode,
         * e.g. when running the rvsa, as any guess won't be reflected
         * in the variant list or content-location headers.
         */
        if (neg->dont_fiddle_headers) {
            return;
        }

        charset = "iso-8859-1"; /* The default charset for HTTP text types */
    }

    /*
     * Go through each of the items on the Accept-Charset header,
     * looking for a match with this variant's charset.  If none
     * match, charset is unacceptable, so set quality to 0.
     */
    for (i = 0; i < neg->accept_charsets->nelts; ++i) {
        accept_rec *type = &accept_recs[i];

        if (!strcmp(type->name, charset)) {
            variant->charset_quality = type->quality;
            return;
        }
        else if (strcmp(type->name, "*") == 0) {
            /* remember the wildcard, but keep looking for an exact match */
            star = type;
        }
    }

    /* No explicit match */
    if (star) {
        variant->charset_quality = star->quality;
        variant->definite = 0;
        return;
    }

    /* If this variant is in charset iso-8859-1, the default is 1.0 */
    if (strcmp(charset, "iso-8859-1") == 0) {
        variant->charset_quality = 1.0f;
    }
    else {
        variant->charset_quality = 0.0f;
    }
}
/* is_identity_encoding reports whether 'enc' names "no real encoding":
 * a NULL or empty string, or one of the legacy tokens 7bit, 8bit and
 * binary.  The legacy tokens are kept for back-compat, but does anyone
 * still use them in their var files??
 *
 * Returns 1 for an identity encoding, 0 otherwise.
 */
static int is_identity_encoding(const char *enc)
{
    static const char *const identity_tokens[] = { "7bit", "8bit", "binary" };
    size_t k;

    if (enc == NULL || *enc == '\0') {
        return 1;
    }

    for (k = 0; k < sizeof(identity_tokens) / sizeof(identity_tokens[0]); ++k) {
        if (strcmp(enc, identity_tokens[k]) == 0) {
            return 1;
        }
    }

    return 0;
}
/*
 * set_encoding_quality works out how acceptable a variant's
 * content-encoding is to the user-agent and stores the answer in
 * variant->encoding_quality.
 *
 * The rules are:
 *  - no Accept-Encoding header at all: every encoding is allowed, but an
 *    unencoded variant is preferred (1.0 versus 0.5);
 *  - an empty Accept-Encoding header: no encodings are acceptable;
 *  - a non-empty Accept-Encoding header: the listed encodings are
 *    acceptable, and so is "no encoding" unless the "identity" encoding
 *    is specifically excluded.
 */
static void set_encoding_quality(negotiation_state *neg, var_rec *variant)
{
    const char *encoding = variant->content_encoding;
    const int unencoded = is_identity_encoding(encoding);
    accept_rec *recs;
    accept_rec *wildcard = NULL;
    float fallback = 0.0f;
    int idx;

    if (neg->accept_encodings == NULL) {
        /* No Accept-Encoding header: everything goes, plain is best */
        variant->encoding_quality = unencoded ? 1.0f : 0.5f;
        return;
    }

    if (unencoded) {
        /* An unencoded variant is looked up as "identity" and stays
         * (barely) acceptable when the header does not mention it.
         */
        encoding = "identity";
        fallback = 0.0001f;
    }

    /* x- prefixes are ignored on both sides of the comparison */
    if (strncmp(encoding, "x-", 2) == 0) {
        encoding += 2;
    }

    recs = (accept_rec *) neg->accept_encodings->elts;

    for (idx = 0; idx < neg->accept_encodings->nelts; ++idx) {
        const char *listed = recs[idx].name;

        if (strncmp(listed, "x-", 2) == 0) {
            listed += 2;
        }

        if (strcmp(listed, encoding) == 0) {
            /* an explicit entry always wins */
            variant->encoding_quality = recs[idx].quality;
            return;
        }

        if (!strcmp(listed, "*")) {
            wildcard = &recs[idx];
        }
    }

    /* No explicit match: use "*" if present, otherwise the encoding is
     * _not_ acceptable unless it is the identity (no encoding).
     */
    variant->encoding_quality = (wildcard != NULL) ? wildcard->quality
                                                   : fallback;
}
/*************************************************************
 * Outcomes the variant selection algorithm can report
 */
enum algorithm_results {
    alg_choice = 1,     /* a variant was chosen */
    alg_list = 2        /* no variant chosen; list the variants */
};
/* Below is the 'best_match' function. It returns an int, which has
* one of the two values alg_choice or alg_list, which give the result
* of the variant selection algorithm. alg_list means that no best
* variant was found by the algorithm, alg_choice means that a best
* variant was found and should be returned. The list/choice
* terminology comes from TCN (rfc2295), but is used in a more generic
* way here. The best variant is returned in *pbest. best_match has
* two possible algorithms for determining the best variant: the
* RVSA/1.0 algorithm (from RFC2296), and the standard Apache
* algorithm. These are split out into separate functions
* (is_variant_better_rvsa() and is_variant_better()). Selection of
* one is through the neg->use_rvsa flag.
*
* The call to best_match also creates full information, including
* language, charset, etc quality for _every_ variant. This is needed
* for generating a correct Vary header, and can be used for the
* Alternates header, the human-readable list responses and 406 errors.
*/
/* Firstly, the RVSA/1.0 (HTTP Remote Variant Selection Algorithm
 * v1.0) from rfc2296.  This is the algorithm that goes together with
 * transparent content negotiation (TCN).
 *
 * Returns 1 if 'variant' should replace 'best', in which case the
 * variant's overall quality is stored in *p_bestq; returns 0 otherwise.
 * 'best' may be NULL when no variant has been selected yet.
 */
static int is_variant_better_rvsa(negotiation_state *neg, var_rec *variant,
                                  var_rec *best, float *p_bestq)
{
    float bestq = *p_bestq, q;

    /* TCN does not cover negotiation on content-encoding.  For now,
     * we ignore the encoding unless it was explicitly excluded.
     */
    if (variant->encoding_quality == 0.0f) {
        return 0;
    }

    q = variant->mime_type_quality *
        variant->source_quality *
        variant->charset_quality *
        variant->lang_quality;

    /* RFC 2296 calls for the result to be rounded to 5 decimal places,
     * but we don't do that because it serves no useful purpose other
     * than to ensure that a remote algorithm operates on the same
     * precision as ours.  That is silly, since what we obviously want
     * is for the algorithm to operate on the best available precision
     * regardless of who runs it.  Since the above calculation may
     * result in significant variance at 1e-12, rounding would be bogus.
     */

#ifdef NEG_DEBUG
    ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL, APLOGNO(00688)
           "Variant: file=%s type=%s lang=%s sourceq=%1.3f "
           "mimeq=%1.3f langq=%1.3f charq=%1.3f encq=%1.3f "
           "q=%1.5f definite=%d",
            (variant->file_name ? variant->file_name : ""),
            (variant->mime_type ? variant->mime_type : ""),
            (variant->content_languages
             ? apr_array_pstrcat(neg->pool, variant->content_languages, ',')
             : ""),
            variant->source_quality,
            variant->mime_type_quality,
            variant->lang_quality,
            variant->charset_quality,
            variant->encoding_quality,
            q,
            variant->definite);
#endif

    if (q <= 0.0f) {
        return 0;
    }

    /* Without a current best there is nothing to compare against, so any
     * acceptable variant wins.  This also keeps us from dereferencing a
     * NULL 'best' below when the caller restarts its search but hands us
     * a *p_bestq left over from an earlier pass.
     */
    if (!best || q > bestq) {
        *p_bestq = q;
        return 1;
    }

    /* If the best variant's encoding is of lesser quality than
     * this variant, then we prefer this variant
     */
    if (q == bestq && variant->encoding_quality > best->encoding_quality) {
        *p_bestq = q;
        return 1;
    }

    return 0;
}
/* Negotiation algorithm as used by previous versions of Apache
 * (just about).
 *
 * For non-transparent negotiation the server may choose how to
 * negotiate.  The checks are applied in this order: content-type,
 * language, content-type level, charset, content encoding, content
 * length.  Each check has one of three outcomes:
 *
 *   - the variant is worse than the current best: return 0
 *   - the variant is better than the current best: store the variant's
 *     q in *p_bestq and return 1
 *   - the two are equally desirable: move on to the next check
 *
 * The checks are deliberately spelled out one by one so that further
 * checks can be added, or their order made configurable (e.g. checking
 * language quality _before_ content type).
 */
static int is_variant_better(negotiation_state *neg, var_rec *variant,
                             var_rec *best, float *p_bestq)
{
    const float bestq = *p_bestq;
    float q;
    const char *variant_cs;
    const char *best_cs;
    int variant_cs_specific;
    int best_cs_default;

#ifdef NEG_DEBUG
    ap_log_error(APLOG_MARK, APLOG_STARTUP, 0, NULL, APLOGNO(00689)
           "Variant: file=%s type=%s lang=%s sourceq=%1.3f "
           "mimeq=%1.3f langq=%1.3f langidx=%d charq=%1.3f encq=%1.3f ",
            (variant->file_name ? variant->file_name : ""),
            (variant->mime_type ? variant->mime_type : ""),
            (variant->content_languages
             ? apr_array_pstrcat(neg->pool, variant->content_languages, ',')
             : ""),
            variant->source_quality,
            variant->mime_type_quality,
            variant->lang_quality,
            variant->lang_index,
            variant->charset_quality,
            variant->encoding_quality);
#endif

    /* A variant that is unacceptable in any single dimension is never
     * considered.
     */
    if (variant->encoding_quality == 0.0f) {
        return 0;
    }
    if (variant->lang_quality == 0.0f) {
        return 0;
    }
    if (variant->source_quality == 0.0f) {
        return 0;
    }
    if (variant->charset_quality == 0.0f) {
        return 0;
    }
    if (variant->mime_type_quality == 0.0f) {
        return 0;
    }

    /* content-type (weighted by the source quality) */
    q = variant->mime_type_quality * variant->source_quality;
    if (q == 0.0 || q < bestq) {
        return 0;
    }
    if (q > bestq || !best) {
        goto take_variant;
    }

    /* language */
    if (variant->lang_quality < best->lang_quality) {
        return 0;
    }
    if (variant->lang_quality > best->lang_quality) {
        goto take_variant;
    }

    /* equal language qualities: fall back on the LanguagePriority index,
     * where -1 means "no index" and a lower index is preferred
     */
    if (best->lang_index != -1 &&
        (variant->lang_index == -1 || variant->lang_index > best->lang_index)) {
        return 0;
    }
    if (variant->lang_index != -1 &&
        (best->lang_index == -1 || variant->lang_index < best->lang_index)) {
        goto take_variant;
    }

    /* content-type level (sometimes used with text/html, though we
     * support it on other types too)
     */
    switch (level_cmp(variant, best)) {
    case -1:
        return 0;
    case 1:
        goto take_variant;
    default:
        break;
    }

    /* charset */
    if (variant->charset_quality < best->charset_quality) {
        return 0;
    }
    if (variant->charset_quality > best->charset_quality) {
        goto take_variant;
    }

    /* Same charset quality: a variant with an explicit charset other
     * than ISO-8859-1 beats a best whose charset is ISO-8859-1 or
     * not given at all.
     */
    variant_cs = variant->content_charset;
    best_cs = best->content_charset;
    variant_cs_specific = variant_cs != NULL
                          && *variant_cs != '\0'
                          && strcmp(variant_cs, "iso-8859-1") != 0;
    best_cs_default = best_cs == NULL
                      || *best_cs == '\0'
                      || strcmp(best_cs, "iso-8859-1") == 0;
    if (variant_cs_specific && best_cs_default) {
        goto take_variant;
    }

    /* Prefer the highest value for encoding_quality. */
    if (variant->encoding_quality < best->encoding_quality) {
        return 0;
    }
    if (variant->encoding_quality > best->encoding_quality) {
        goto take_variant;
    }

    /* content length if all else equal: only a strictly shorter variant
     * replaces the current best
     */
    if (find_content_length(neg, variant) < find_content_length(neg, best)) {
        goto take_variant;
    }
    return 0;

take_variant:
    *p_bestq = q;
    return 1;
}
/* Tell whether a variant is tagged with a specific language.
 * The answer is also "no" (0) when no language was asked for or when
 * the variant has no languages at all.
 */
static int variant_has_language(var_rec *variant, const char *lang)
{
    apr_array_header_t *tagged;
    char **names;
    int count;
    int idx;

    /* fast exit */
    if (lang == NULL) {
        return 0;
    }

    tagged = variant->content_languages;
    if (tagged == NULL) {
        return 0;
    }

    count = tagged->nelts;
    if (count == 0) {
        return 0;
    }

    names = (char **) tagged->elts;
    for (idx = 0; idx < count; ++idx) {
        if (strcmp(lang, names[idx]) == 0) {
            return 1;
        }
    }

    return 0;
}
/* Decide whether a variant has to be dropped because of the
 * environment variables 'no-gzip' and 'gzip-only-text/html', to get a
 * behaviour similar to mod_deflate.
 *
 * 'discard' is the mode the caller derived from those variables.
 * Returns 1 if the variant must be discarded, 0 if it may be negotiated.
 */
static int discard_variant_by_env(var_rec *variant, int discard)
{
    const char *encoding = variant->content_encoding;

    /* Unencoded variants are never discarded */
    if (is_identity_encoding(encoding) || strcmp(encoding, "identity") == 0) {
        return 0;
    }

    if (discard == DISCARD_ALL_ENCODINGS) {
        return 1;
    }

    if (discard != DISCARD_ALL_BUT_HTML) {
        return 0;
    }

    /* only variants whose type starts with text/html may stay encoded */
    return variant->mime_type == NULL
           || strncmp(variant->mime_type, "text/html", 9) != 0;
}
/* Computes the quality values of the available variants and, if
 * neg->may_choose is set, selects the best one.
 *
 * The best variant (or NULL) is returned in *pbest.  The return value is
 * alg_choice when a best variant was found and should be served, and
 * alg_list otherwise.
 */
static int best_match(negotiation_state *neg, var_rec **pbest)
{
    int j;
    var_rec *best;
    float bestq;
    enum algorithm_results algorithm_result;
    int may_discard = 0;
    var_rec *avail_recs = (var_rec *) neg->avail_vars->elts;

    /* fetch request dependent variables
     * prefer-language: prefer a certain language.
     */
    const char *preferred_language = apr_table_get(neg->r->subprocess_env,
                                                   "prefer-language");

    /* no-gzip: do not send encoded documents */
    if (apr_table_get(neg->r->subprocess_env, "no-gzip")) {
        may_discard = DISCARD_ALL_ENCODINGS;
    }

    /* gzip-only-text/html: send encoded documents only
     * if they are text/html. (no-gzip has a higher priority).
     */
    else {
        const char *env_value = apr_table_get(neg->r->subprocess_env,
                                              "gzip-only-text/html");

        if (env_value && !strcmp(env_value, "1")) {
            may_discard = DISCARD_ALL_BUT_HTML;
        }
    }

    set_default_lang_quality(neg);

    /*
     * Find the 'best' variant
     * We run the loop possibly twice: if "prefer-language"
     * environment variable is set but we did not find an appropriate
     * best variant. In that case forget the preferred language and
     * negotiate over all variants.
     */
    for (;;) {
        /* Every pass starts from scratch.  The best score has to be
         * reset together with the best variant: a score left over from
         * a discarded prefer-language pass would otherwise be compared
         * against while 'best' is NULL.
         */
        best = NULL;
        bestq = 0.0f;

        for (j = 0; j < neg->avail_vars->nelts; ++j) {
            var_rec *variant = &avail_recs[j];

            /* if this variant is encoded somehow and there are special
             * variables set, we do not negotiate it. see above.
             */
            if (   may_discard
                && discard_variant_by_env(variant, may_discard)) {
                continue;
            }

            /* if a language is preferred, but the current variant
             * is not in that language, then drop it for now
             */
            if (   preferred_language
                && !variant_has_language(variant, preferred_language)) {
                continue;
            }

            /* Find all the relevant 'quality' values from the
             * Accept... headers, and store in the variant.  This also
             * prepares for sending an Alternates header etc so we need to
             * do it even if we do not actually plan to find a best
             * variant.
             */
            set_accept_quality(neg, variant);

            /* accept the preferred language, even when it's not listed within
             * the Accept-Language header
             */
            if (preferred_language) {
                variant->lang_quality = 1.0f;
                variant->definite = 1;
            }
            else {
                set_language_quality(neg, variant);
            }
            set_encoding_quality(neg, variant);
            set_charset_quality(neg, variant);

            /* Only do variant selection if we may actually choose a
             * variant for the client
             */
            if (neg->may_choose) {

                /* Now find out if this variant is better than the current
                 * best, either using the RVSA/1.0 algorithm, or Apache's
                 * internal server-driven algorithm. Presumably other
                 * server-driven algorithms are possible, and could be
                 * implemented here.
                 */
                if (neg->use_rvsa) {
                    if (is_variant_better_rvsa(neg, variant, best, &bestq)) {
                        best = variant;
                    }
                }
                else {
                    if (is_variant_better(neg, variant, best, &bestq)) {
                        best = variant;
                    }
                }
            }
        }

        /* We now either have a best variant, or no best variant */

        if (neg->use_rvsa) {
            /* calculate result for RVSA/1.0 algorithm:
             * only a choice response if the best variant has q>0
             * and is definite
             */
            algorithm_result = (best && best->definite) && (bestq > 0) ?
                               alg_choice : alg_list;
        }
        else {
            /* calculate result for Apache negotiation algorithm */
            algorithm_result = bestq > 0 ? alg_choice : alg_list;
        }

        /* run the loop again, if the "prefer-language" got no clear result */
        if (preferred_language && (!best || algorithm_result != alg_choice)) {
            preferred_language = NULL;
            continue;
        }

        break;
    }

    /* Returning a choice response with a non-neighboring variant is a
     * protocol security error in TCN (see rfc2295).  We do *not*
     * verify here that the variant and URI are neighbors, even though
     * we may return alg_choice.  We depend on the environment (the
     * caller) to only declare the resource transparently negotiable if
     * all variants are neighbors.
     */
    *pbest = best;
    return algorithm_result;
}
/* Sets response headers for a negotiated response.
 * neg->is_transparent determines whether a transparently negotiated
 * response or a plain `server driven negotiation' response is
 * created.   Applicable headers are Alternates, Vary, and TCN.
 *
 * The Vary header we create is sometimes longer than is required for
 * the correct caching of negotiated results by HTTP/1.1 caches.  For
 * example if we have 3 variants x.html, x.ps.en and x.ps.nl, and if
 * the Accept: header assigns a 0 quality to .ps, then the results of
 * the two server-side negotiation algorithms we currently implement
 * will never depend on Accept-Language so we could return `Vary:
 * negotiate, accept' instead of the longer 'Vary: negotiate, accept,
 * accept-language' which the code below will return.  A routine for
 * computing the exact minimal Vary header would be a huge pain to code
 * and maintain though, especially because we need to take all possible
 * twiddles in the server-side negotiation algorithms into account.
 *
 * Parameters:
 *   r           request whose err_headers_out table receives the headers;
 *               all strings are allocated from r->pool
 *   neg         negotiation state; avail_vars, send_alternates and
 *               is_transparent are read
 *   alg_result  alg_list or alg_choice; only used to pick the value of
 *               the TCN header
 */
static void set_neg_headers(request_rec *r, negotiation_state *neg,
                            int alg_result)
{
    apr_table_t *hdrs;
    var_rec *avail_recs = (var_rec *) neg->avail_vars->elts;
    /* attributes of the first variant, used as the baseline for Vary */
    const char *sample_type = NULL;
    const char *sample_language = NULL;
    const char *sample_encoding = NULL;
    const char *sample_charset = NULL;
    char *lang;
    char *qstr;
    apr_off_t len;
    apr_array_header_t *arr;
    /* at most 21 substrings are pushed per variant, see the loop below */
    int max_vlist_array = (neg->avail_vars->nelts * 21);
    int first_variant = 1;
    int vary_by_type = 0;
    int vary_by_language = 0;
    int vary_by_charset = 0;
    int vary_by_encoding = 0;
    int j;

    /* In order to avoid O(n^2) memory copies in building Alternates,
     * we preallocate an array with the maximum substrings possible,
     * fill it with the variant list, and then concatenate the entire array.
     * Note that if you change the number of substrings pushed, you also
     * need to change the calculation of max_vlist_array above.
     */
    if (neg->send_alternates && neg->avail_vars->nelts)
        arr = apr_array_make(r->pool, max_vlist_array, sizeof(char *));
    else
        arr = NULL;

    /* Put headers into err_headers_out, since send_http_header()
     * outputs both headers_out and err_headers_out.
     */
    hdrs = r->err_headers_out;

    for (j = 0; j < neg->avail_vars->nelts; ++j) {
        var_rec *variant = &avail_recs[j];

        /* comma-separated list of this variant's languages, or NULL */
        if (variant->content_languages && variant->content_languages->nelts) {
            lang = apr_array_pstrcat(r->pool, variant->content_languages, ',');
        }
        else {
            lang = NULL;
        }

        /* Calculate Vary by looking for any difference between variants.
         * Every later variant is compared with the first one; a missing
         * (NULL) attribute compares equal to an empty string.
         */
        if (first_variant) {
            sample_type = variant->mime_type;
            sample_charset = variant->content_charset;
            sample_language = lang;
            sample_encoding = variant->content_encoding;
        }
        else {
            if (!vary_by_type &&
                strcmp(sample_type ? sample_type : "",
                       variant->mime_type ? variant->mime_type : "")) {
                vary_by_type = 1;
            }
            if (!vary_by_charset &&
                strcmp(sample_charset ? sample_charset : "",
                       variant->content_charset ?
                       variant->content_charset : "")) {
                vary_by_charset = 1;
            }
            if (!vary_by_language &&
                strcmp(sample_language ? sample_language : "",
                       lang ? lang : "")) {
                vary_by_language = 1;
            }
            if (!vary_by_encoding &&
                strcmp(sample_encoding ? sample_encoding : "",
                       variant->content_encoding ?
                       variant->content_encoding : "")) {
                vary_by_encoding = 1;
            }
        }
        first_variant = 0;

        /* the rest of the loop body only builds the Alternates entry */
        if (!neg->send_alternates)
            continue;

        /* Generate the string components for this Alternates entry */
        *((const char **) apr_array_push(arr)) = "{\"";
        *((const char **) apr_array_push(arr)) = ap_escape_path_segment(r->pool, variant->file_name);
        *((const char **) apr_array_push(arr)) = "\" ";

        /* 6 bytes hold "d.ddd" plus the terminating NUL; this assumes
         * source_quality prints with a single digit before the decimal
         * point - TODO confirm the range against where it is parsed.
         */
        qstr = (char *) apr_palloc(r->pool, 6);
        apr_snprintf(qstr, 6, "%1.3f", variant->source_quality);

        /* Strip trailing zeros (saves those valuable network bytes).
         * When all three decimals are zero the string is cut at index 1,
         * which removes the decimal point as well.
         */
        if (qstr[4] == '0') {
            qstr[4] = '\0';
            if (qstr[3] == '0') {
                qstr[3] = '\0';
                if (qstr[2] == '0') {
                    qstr[1] = '\0';
                }
            }
        }
        *((const char **) apr_array_push(arr)) = qstr;

        if (variant->mime_type && *variant->mime_type) {
            *((const char **) apr_array_push(arr)) = " {type ";
            *((const char **) apr_array_push(arr)) = variant->mime_type;
            *((const char **) apr_array_push(arr)) = "}";
        }
        if (variant->content_charset && *variant->content_charset) {
            *((const char **) apr_array_push(arr)) = " {charset ";
            *((const char **) apr_array_push(arr)) = variant->content_charset;
            *((const char **) apr_array_push(arr)) = "}";
        }
        if (lang) {
            *((const char **) apr_array_push(arr)) = " {language ";
            *((const char **) apr_array_push(arr)) = lang;
            *((const char **) apr_array_push(arr)) = "}";
        }
        if (variant->content_encoding && *variant->content_encoding) {
            /* Strictly speaking, this is non-standard, but so is TCN */

            *((const char **) apr_array_push(arr)) = " {encoding ";
            *((const char **) apr_array_push(arr)) = variant->content_encoding;
            *((const char **) apr_array_push(arr)) = "}";
        }

        /* Note that the Alternates specification (in rfc2295) does
         * not require that we include {length x}, so we could omit it
         * if determining the length is too expensive.  We currently
         * always include it though.
         *
         * If the variant is a CGI script, find_content_length would
         * return the length of the script, not the output it
         * produces, so we check for the presence of a handler and if
         * there is one we don't add a length.
         *
         * XXX: TODO: This check does not detect a CGI script if we
         * get the variant from a type map.  This needs to be fixed
         * (without breaking things if the type map specifies a
         * content-length, which currently leads to the correct result).
         */
        if (!(variant->sub_req && variant->sub_req->handler)
            && (len = find_content_length(neg, variant)) >= 0) {

            *((const char **) apr_array_push(arr)) = " {length ";
            *((const char **) apr_array_push(arr)) = apr_off_t_toa(r->pool,
                                                                   len);
            *((const char **) apr_array_push(arr)) = "}";
        }

        *((const char **) apr_array_push(arr)) = "}";
        *((const char **) apr_array_push(arr)) = ", "; /* trimmed below */
    }

    if (neg->send_alternates && neg->avail_vars->nelts) {
        /* dropping the last element discards the trailing ", " */
        arr->nelts--;                                 /* remove last comma */
        apr_table_mergen(hdrs, "Alternates",
                         apr_array_pstrcat(r->pool, arr, '\0'));
    }

    if (neg->is_transparent || vary_by_type || vary_by_language ||
        vary_by_charset || vary_by_encoding) {

        /* Every piece starts with ", "; adding 2 to the concatenated
         * string skips the separator in front of the first piece.
         */
        apr_table_mergen(hdrs, "Vary", 2 + apr_pstrcat(r->pool,
            neg->is_transparent ? ", negotiate" : "",
            vary_by_type ? ", accept" : "",
            vary_by_language ? ", accept-language" : "",
            vary_by_charset ? ", accept-charset" : "",
            vary_by_encoding ? ", accept-encoding" : "", NULL));
    }

    if (neg->is_transparent) { /* Create TCN response header */
        apr_table_setn(hdrs, "TCN",
                       alg_result == alg_list ? "list" : "choice");
    }
}
/**********************************************************************
 *
 * Return an HTML list of variants. This is output as part of the
 * choice response or 406 status body.
 *
 * The list is built from neg->avail_vars and allocated from r->pool.
 * Each item links to the variant's file name and is followed by the
 * variant's description and by those of its type, language, charset and
 * encoding attributes that are actually set.
 */
static char *make_variant_list(request_rec *r, negotiation_state *neg)
{
    apr_array_header_t *arr;
    int i;
    /* at most 15 substrings per variant, plus the list header and footer */
    int max_vlist_array = (neg->avail_vars->nelts * 15) + 2;

    /* In order to avoid O(n^2) memory copies in building the list,
     * we preallocate an array with the maximum substrings possible,
     * fill it with the variant list, and then concatenate the entire array.
     */
    arr = apr_array_make(r->pool, max_vlist_array, sizeof(char *));

    *((const char **) apr_array_push(arr)) = "Available variants:\n<ul>\n";

    for (i = 0; i < neg->avail_vars->nelts; ++i) {
        var_rec *variant = &((var_rec *) neg->avail_vars->elts)[i];
        const char *filename = variant->file_name ? variant->file_name : "";
        apr_array_header_t *languages = variant->content_languages;
        const char *description = variant->description
                                    ? variant->description
                                    : "";

        /* The format isn't very neat, and it would be nice to make
         * the tags human readable (eg replace 'language en' with 'English').
         * Note that if you change the number of substrings pushed, you also
         * need to change the calculation of max_vlist_array above.
         */
        *((const char **) apr_array_push(arr)) = "<li><a href=\"";
        *((const char **) apr_array_push(arr)) = ap_escape_path_segment(r->pool, filename);
        *((const char **) apr_array_push(arr)) = "\">";
        *((const char **) apr_array_push(arr)) = ap_escape_html(r->pool, filename);
        *((const char **) apr_array_push(arr)) = "</a> ";
        *((const char **) apr_array_push(arr)) = description;

        if (variant->mime_type && *variant->mime_type) {
            *((const char **) apr_array_push(arr)) = ", type ";
            *((const char **) apr_array_push(arr)) = variant->mime_type;
        }
        if (languages && languages->nelts) {
            *((const char **) apr_array_push(arr)) = ", language ";
            *((const char **) apr_array_push(arr)) = apr_array_pstrcat(r->pool,
                                                       languages, ',');
        }
        if (variant->content_charset && *variant->content_charset) {
            *((const char **) apr_array_push(arr)) = ", charset ";
            *((const char **) apr_array_push(arr)) = variant->content_charset;
        }
        /* Like the other attributes, an empty encoding is treated as
         * "not set" so that no dangling ", encoding " item is produced.
         */
        if (variant->content_encoding && *variant->content_encoding) {
            *((const char **) apr_array_push(arr)) = ", encoding ";
            *((const char **) apr_array_push(arr)) = variant->content_encoding;
        }
        *((const char **) apr_array_push(arr)) = "</li>\n";
    }
    *((const char **) apr_array_push(arr)) = "</ul>\n";

    return apr_array_pstrcat(r->pool, arr, '\0');
}
/* Builds the HTML variant list and stores it under the "variant-list"
 * note.  For a subrequest both the note and the list's allocation go to
 * the main request (r->main); otherwise they go to r itself.
 */
static void store_variant_list(request_rec *r, negotiation_state *neg)
{
    request_rec *owner = (r->main != NULL) ? r->main : r;

    apr_table_setn(owner->notes, "variant-list",
                   make_variant_list(owner, neg));
}
/* Called if we got a "Choice" response from the variant selection
 * algorithm, i.e. the normal variant response plus some extra headers.
 *
 * The chosen variant is checked to make sure it is not itself
 * negotiated; if it is, HTTP_VARIANT_ALSO_VARIES is returned.  If the
 * variant's subrequest has to be created here and it fails, its status
 * is returned.  Otherwise the appropriate headers are added to the
 * current response and 0 is returned, leaving the normal variant
 * handling (and adding Expires) to the caller.
 */
static int setup_choice_response(request_rec *r, negotiation_state *neg,
                                 var_rec *variant)
{
    request_rec *chosen = variant->sub_req;
    const char *chosen_vary;

    if (chosen == NULL) {
        /* No subrequest for this variant yet: look the file up now */
        chosen = ap_sub_req_lookup_file(variant->file_name, r, r->output_filters);

        if (chosen->status != HTTP_OK
            && apr_table_get(chosen->err_headers_out, "TCN") == NULL) {
            int failed_status = chosen->status;

            ap_destroy_sub_req(chosen);
            return failed_status;
        }
        variant->sub_req = chosen;
    }

    /* A transparent type map must not select a transparent multiviews
     * resource as its best variant.
     *
     * XXX: No error is signalled when a transparent type map selects a
     * _non_transparent multiviews resource, because a legal negotiation
     * response can be generated for that.  The vlist_validator of the
     * nontransparent subrequest is lost in that case however, so a
     * change in its set of variants or negotiation algorithm may never
     * be propagated up to a HTTP/1.1 cache which interprets Vary.  To be
     * completely on the safe side HTTP_VARIANT_ALSO_VARIES should be
     * returned for this type of recursive negotiation too.
     */
    if (neg->is_transparent
        && apr_table_get(chosen->err_headers_out, "TCN") != NULL) {
        return HTTP_VARIANT_ALSO_VARIES;
    }

    /* A transparent type map must not recursively select another type
     * map which itself causes transparent negotiation to be done.
     *
     * XXX: This is caught by rejecting every case of type map recursion.
     * Some borderline recursive arrangements would produce neither
     * protocol errors nor cache propagation problems, but they are very
     * hard to detect at this point in the control flow, so they are not
     * singled out.
     *
     * Recursive type maps imply a recursive arrangement of negotiated
     * resources which is visible to outside clients, which the
     * transparent negotiation caching protocols do not support.  Generic
     * support would need a configuration setting that makes all type
     * maps non-transparent when recursion is enabled, and - to propagate
     * type map changes into HTTP/1.1 caches that handle Vary - an
     * extension of the mechanism for generating variant list validators.
     */
    if (chosen->handler != NULL && !strcmp(chosen->handler, "type-map")) {
        return HTTP_VARIANT_ALSO_VARIES;
    }

    /* Add a Variant-Vary header if the subrequest is a multiviews
     * resource.
     *
     * XXX: TODO: A Vary header returned by a CGI script is _not_ handled,
     * because it has not been seen yet at this point in the control
     * flow.  That causes no cache consistency problems _unless_ the CGI
     * script also returns a Cache-Control header marking the response as
     * cachable.  This needs to be fixed, as do the problems that arise
     * when a CGI returns an Etag header.
     */
    chosen_vary = apr_table_get(chosen->err_headers_out, "Vary");
    if (chosen_vary != NULL) {
        apr_table_setn(r->err_headers_out, "Variant-Vary", chosen_vary);

        /* Move the subrequest's Vary header into the main request, so the
         * response does not end up with two Vary headers, which would be
         * legal but strange.
         */
        apr_table_setn(r->err_headers_out, "Vary", chosen_vary);
        apr_table_unset(chosen->err_headers_out, "Vary");
    }

    apr_table_setn(r->err_headers_out, "Content-Location",
                   ap_escape_path_segment(r->pool, variant->file_name));

    /* add Alternates and Vary */
    set_neg_headers(r, neg, alg_choice);

    /* Still to do by caller: add Expires */
    return 0;
}
/****************************************************************
*
* Executive...
*/
/*
 * Run variant selection for request r over the candidates held in
 * neg->avail_vars and hand the winner back through *bestp.
 *
 *   r               request being negotiated
 *   neg             negotiation state (candidates, flags, accept info)
 *   bestp           receives the variant picked by best_match()
 *   prefer_scripts  forwarded to maybe_add_default_accepts()
 *
 * Returns OK once a variant has been selected and the negotiation
 * headers are in place.  When best_match() reports alg_list the result is
 * HTTP_MULTIPLE_CHOICES for a transparent resource whose user agent
 * supports transparent negotiation, or HTTP_NOT_ACCEPTABLE when *bestp is
 * NULL.  A non-zero result of setup_choice_response() is passed through
 * unchanged.
 */
static int do_negotiation(request_rec *r, negotiation_state *neg,
                          var_rec **bestp, int prefer_scripts)
{
    var_rec *variants = (var_rec *) neg->avail_vars->elts;
    int outcome;    /* alg_choice or alg_list, as returned by best_match() */
    int status;
    int idx;

    /* Transparent negotiation is only considered for GET; HEAD shares
     * GET's method number, so it is covered as well.  Whether this
     * should be configurable is an open question, see also the remarks
     * about recursive type maps in setup_choice_response().
     */
    if (r->method_number == M_GET) {
        /* A map file sitting in the middle of the request URI
         * (non-empty path_info) rules transparency out.
         */
        int transparent = !(r->path_info && *r->path_info);

        for (idx = 0; idx < neg->avail_vars->nelts; ++idx) {
            var_rec *candidate = &variants[idx];

            /* Two further disqualifiers:
             *  - a non-neighboring variant (a '/' in its file name, which
             *    can occur when processing a type map) violates internal
             *    assumptions made by best_match();
             *  - the behavior of variant typemap bodies is not compatible
             *    with transparent negotiation either.
             */
            if (ap_strchr_c(candidate->file_name, '/') || candidate->body) {
                transparent = 0;
            }
        }

        neg->is_transparent = transparent;
    }

    if (!neg->is_transparent) {
        /* configure negotiation on a non-transparent resource */
        neg->may_choose = 1;
    }
    else {
        parse_negotiate_header(r, neg);
    }

    maybe_add_default_accepts(neg, prefer_scripts);

    /* outcome is alg_choice when a best variant was chosen, alg_list
     * when none was.
     */
    outcome = best_match(neg, bestp);

    if (outcome == alg_list) {
        /* Either a list response or a HTTP_NOT_ACCEPTABLE error follows;
         * the Alternates header is always included in this case.
         */
        neg->send_alternates = 1;
        set_neg_headers(r, neg, outcome);
        store_variant_list(r, neg);

        if (neg->is_transparent && neg->ua_supports_trans) {
            /* XXX todo: expires? cachability?
             *
             * Some HTTP/1.0 clients are known to choke on a 300
             * (multiple choices) response that lacks a Location header.
             * The 300 generated here only reaches 1.0 clients that
             * support transparent negotiation, and those should cope.
             * Older 1.0 clients should never see it, even with
             * CacheNegotiatedDocs enabled, because no 1.0 proxy cache
             * (that we know of) caches and returns 300 responses; a
             * cache conforming to the HTTP/1.0 specification certainly
             * will not.
             */
            return HTTP_MULTIPLE_CHOICES;
        }

        if (*bestp == NULL) {
            ap_log_rerror(APLOG_MARK, APLOG_ERR, 0, r, APLOGNO(00690)
                          "no acceptable variant: %s", r->filename);
            return HTTP_NOT_ACCEPTABLE;
        }
    }

    /* From here on a variant has been chosen.
     * XXX todo: merge the two branches below.
     */
    if (!neg->is_transparent) {
        set_neg_headers(r, neg, outcome);
    }
    else {
        status = setup_choice_response(r, neg, *bestp);
        if (status != 0) {
            return status;      /* propagate the error */
        }
    }

    /* Caching: Vary is expected to take care of HTTP/1.1, but for
     * HTTP/1.0 caching cannot be allowed at all.
     *
     * XXX: r->no_cache (which causes "Expires: <now>" to be added) is
     * only set when answering an HTTP/1.0 client.  For a 1.1 client it is
     * left alone, because "Expires: <now>" would degrade 1.1 cache
     * performance by forcing revalidation before every re-use.  If that
     * 1.1 client is a proxy that was contacted by a 1.0 client, or a
     * proxy cache that 1.0 clients may contact later, we currently rely
     * on the proxy to add "Expires: <now>" when it forwards the response.
     *
     * XXX: TODO: Find out whether the 1.1 spec requires proxies and
     * tunnels to add "Expires: <now>" when forwarding to 1.0 clients;
     * (kh) recalls it being rather vague on this point.  Testing real
     * 1.1 proxy implementations would help too.  If proxies do not add
     * it, we would always have to send "Expires: <now>" ourselves to get
     * correct caching, which hurts HTTP/1.1 cache efficiency unless
     * "Cache-Control: max-age=N" is sent as well -- which is currently
     * not done.
     *
     * Roy: No.  HTTP's future is not going to be compromised just so
     * that clients nobody bothered to upgrade always get perfect
     * server-side negotiation; those clients send bogus accept headers
     * anyway.
     *
     * A manually configured Cache-Control/Expires always overrides this
     * automated kluge, on purpose.
     */
    if (!do_cache_negotiated_docs(r->server)
        && r->proto_num < HTTP_VERSION(1,1)
        && neg->count_multiviews_variants != 1) {
        r->no_cache = 1;
    }

    return OK;
}
/*
 * Content handler for type-map files.
 *
 * Declines unless r->handler is MAP_FILE_MAGIC_TYPE or "type-map".
 * Otherwise the map is read, negotiation is run, and the chosen variant
 * is delivered in one of two ways:
 *   - a variant without a body is served through an internal redirect to
 *     its file name, relative to the directory of r->uri;
 *   - a variant with a body is sent straight out of the map file.
 *
 * Returns DECLINED, OK, or the status produced by read_type_map(),
 * do_negotiation(), the method check, ap_meets_conditions(),
 * ap_discard_request_body() or ap_pass_brigade_fchk().
 */
static int handle_map_file(request_rec *r)
{
    negotiation_state *neg;
    apr_file_t *map;
    var_rec *best;
    conn_rec *c;
    apr_bucket_brigade *bb;
    apr_bucket *eos;
    const char *new_req;
    const char *trailing;
    char *udir;
    int res;

    if (strcmp(r->handler, MAP_FILE_MAGIC_TYPE) != 0
        && strcmp(r->handler, "type-map") != 0) {
        return DECLINED;
    }

    neg = parse_accept_headers(r);

    res = read_type_map(&map, neg, r);
    if (res != 0) {
        return res;
    }

    res = do_negotiation(r, neg, &best, 0);
    if (res != 0) {
        return res;
    }

    if (!best->body) {
        /* The variant lives in a file of its own: redirect to it. */

        if (r->path_info && *r->path_info) {
            /* Cut the path_info off the end of the uri before deriving
             * the new file name from it; the original request's
             * path_info is passed along on the redirect.
             */
            r->uri[ap_find_path_info(r->uri, r->path_info)] = '\0';
        }

        udir = ap_escape_uri(r->pool, ap_make_dirstr_parent(r->pool, r->uri));

        /* apr_pstrcat() stops at the first NULL argument, so a missing
         * path_info is replaced by an empty string before concatenating.
         */
        trailing = r->path_info ? r->path_info : "";

        if (r->args) {
            new_req = apr_pstrcat(r->pool, udir, best->file_name,
                                  trailing, "?", r->args, NULL);
        }
        else {
            new_req = apr_pstrcat(r->pool, udir, best->file_name,
                                  trailing, NULL);
        }

        ap_internal_redirect(new_req, r);
        return OK;
    }

    /* The variant's content is embedded in the map file itself. */

    ap_allow_standard_methods(r, REPLACE_ALLOW, M_GET, M_OPTIONS,
                              M_POST, -1);

    /* XXX: should M_OPTIONS be answered with ap_send_http_options(r)
     * at this point?  As it stands only GET and POST get through.
     */
    if (r->method_number != M_GET && r->method_number != M_POST) {
        return HTTP_METHOD_NOT_ALLOWED;
    }

    /* ### ap_update_mtime(r, r->finfo.mtime), ap_set_last_modified(r)
     * and ap_set_etag(r) are not called here; they may be implemented
     * by adding some 'extra' info of the file offset onto the etag.
     */
    ap_set_accept_ranges(r);
    ap_set_content_length(r, best->bytes);

    /* MIME type and charset, as negotiated */
    if (best->mime_type && *best->mime_type) {
        const char *ctype;

        if (best->content_charset && *best->content_charset) {
            ctype = apr_pstrcat(r->pool, best->mime_type, "; charset=",
                                best->content_charset, NULL);
        }
        else {
            ctype = apr_pstrdup(r->pool, best->mime_type);
        }
        ap_set_content_type(r, ctype);
    }

    /* Content-Language(s), as negotiated */
    if (best->content_languages && best->content_languages->nelts) {
        r->content_languages = apr_array_copy(r->pool,
                                              best->content_languages);
    }

    /* Content-Encoding, as negotiated */
    if (best->content_encoding && *best->content_encoding) {
        r->content_encoding = apr_pstrdup(r->pool, best->content_encoding);
    }

    res = ap_meets_conditions(r);
    if (res != OK) {
        return res;
    }

    res = ap_discard_request_body(r);
    if (res != OK) {
        return res;
    }

    /* Send best->bytes bytes of the map file, starting at offset
     * best->body, followed by an EOS bucket.
     */
    c = r->connection;
    bb = apr_brigade_create(r->pool, c->bucket_alloc);
    apr_brigade_insert_file(bb, map, best->body, best->bytes, r->pool);
    eos = apr_bucket_eos_create(c->bucket_alloc);
    APR_BRIGADE_INSERT_TAIL(bb, eos);

    return ap_pass_brigade_fchk(r, bb, NULL);
}
/*
 * Type-checker hook implementing MultiViews.
 *
 * Only acts when the request did not map onto an existing file
 * (r->finfo.filetype is APR_NOFILE) and OPT_MULTI is among the allowed
 * options.  The variants are collected with read_types_multi(), one is
 * picked by do_negotiation(), and the sub-request of the winner is
 * promoted into r with ap_internal_fast_redirect().
 *
 * Returns DECLINED when the hook does not apply or no variants were
 * found, OK on success, and otherwise the failing status of
 * read_types_multi(), do_negotiation() or the sub-request lookup.
 */
static int handle_multi(request_rec *r)
{
    negotiation_state *neg;
    var_rec *best, *variants;
    var_rec *keep = NULL;       /* variant whose sub_req must survive */
    request_rec *chosen;
    int prefer_scripts;
    int status;
    int idx;

    if (r->finfo.filetype != APR_NOFILE) {
        return DECLINED;
    }
    if (!(ap_allow_options(r) & OPT_MULTI)) {
        return DECLINED;
    }

    neg = parse_accept_headers(r);

    status = read_types_multi(neg);
    if (status != 0) {
        goto release_variants;
    }

    if (neg->avail_vars->nelts == 0) {
        return DECLINED;
    }

    prefer_scripts = (r->method_number != M_GET) || r->args ||
                     (r->path_info && *r->path_info);

    status = do_negotiation(r, neg, &best, prefer_scripts);
    if (status != 0) {
        goto release_variants;
    }

    chosen = best->sub_req;
    if (chosen == NULL) {
        /* The variant came out of a map file, so there is no sub_req
         * structure for it yet.  Get one now.
         */
        chosen = ap_sub_req_lookup_file(best->file_name, r,
                                        r->output_filters);
        if (chosen->status != HTTP_OK) {
            status = chosen->status;
            ap_destroy_sub_req(chosen);
            goto release_variants;
        }
    }

    if (chosen->args == NULL) {
        chosen->args = r->args;
    }

    /* "fast redirect": promotes the sub-request into the main request */
    ap_internal_fast_redirect(chosen, r);

    /* Give no advice about the modification time of this response.
     * Perhaps the last mtime among all variants should be tallied and
     * the most recent one used, but that could confuse the proxies.
     */
    r->mtime = 0;

    /* The favorite's sub_req is now merged into the main request and
     * must be spared by the cleanup below.
     */
    keep = best;
    status = OK;

release_variants:
    /* Free the memory held by the variants' sub-requests: all of them
     * on a failure path (keep is still NULL), all but the favorite on
     * success.
     */
    variants = (var_rec *) neg->avail_vars->elts;
    for (idx = 0; idx < neg->avail_vars->nelts; ++idx) {
        var_rec *candidate = &variants[idx];

        if (candidate != keep && candidate->sub_req) {
            ap_destroy_sub_req(candidate->sub_req);
        }
    }

    return status;
}
/**********************************************************************
 * Content-encoding tokens come in two flavors: some clients send and
 * expect an x- token (e.g. x-gzip), others the plain token (i.e. gzip).
 * This fixup tries to answer with whichever form the client used:
 *
 *   1. If the Accept-Encoding header contains the plain token matching
 *      the response's content encoding, the plain token is used.
 *   2. Otherwise, if it contains the x- form, the x- token is used.
 *   3. Otherwise nothing is changed.
 *
 * Consequently, when no Accept-Encoding header was sent, or it holds no
 * token compatible with the final content encoding, the Content-Encoding
 * header carries whatever was specified in the AddEncoding directive.
 *
 * Returns OK when r->content_encoding was set from the client's token,
 * DECLINED otherwise.
 */
static int fix_encoding(request_rec *r)
{
    const char *wanted = r->content_encoding;
    const char *x_match = NULL;
    apr_array_header_t *offered;
    accept_rec *entries;
    int idx;

    if (wanted == NULL || *wanted == '\0') {
        return DECLINED;
    }

    /* Compare on the plain token, whichever form the response carries. */
    if (strncmp(wanted, "x-", 2) == 0) {
        wanted += 2;
    }

    offered = do_header_line(r->pool,
                             apr_table_get(r->headers_in, "Accept-Encoding"));
    if (offered == NULL) {
        return DECLINED;
    }

    entries = (accept_rec *) offered->elts;

    for (idx = 0; idx < offered->nelts; ++idx) {
        char *token = entries[idx].name;

        /* A plain-token match wins immediately. */
        if (strcmp(token, wanted) == 0) {
            r->content_encoding = token;
            return OK;
        }

        /* Remember an x- match, but keep looking for a plain one. */
        if (strncmp(token, "x-", 2) == 0 && strcmp(token + 2, wanted) == 0) {
            x_match = token;
        }
    }

    if (x_match == NULL) {
        return DECLINED;
    }

    r->content_encoding = x_match;
    return OK;
}
/*
 * Attach this module's three callbacks to the server's hooks.  The pool
 * argument p is not used.
 */
static void register_hooks(apr_pool_t *p)
{
    /* MultiViews resolution, registered with APR_HOOK_FIRST */
    ap_hook_type_checker(handle_multi, NULL, NULL, APR_HOOK_FIRST);

    /* x-/plain Content-Encoding token adjustment */
    ap_hook_fixups(fix_encoding, NULL, NULL, APR_HOOK_MIDDLE);

    /* type-map content handler */
    ap_hook_handler(handle_map_file, NULL, NULL, APR_HOOK_MIDDLE);
}
/*
 * Module record for mod_negotiation.  Only per-directory configuration
 * is provided; both per-server slots are NULL.
 */
AP_DECLARE_MODULE(negotiation) =
{
    STANDARD20_MODULE_STUFF,
    create_neg_dir_config,      /* per-directory config creator */
    merge_neg_dir_configs,      /* per-directory config merger */
    NULL,                       /* per-server config creator */
    NULL,                       /* per-server config merger */
    negotiation_cmds,           /* configuration directive table */
    register_hooks              /* hook registration */
};