mod_heartmonitor.c revision 6571b51afefea37aaf42df4986ec979dcd45777b
eac684ef1c29684b1bcd27a89c38c202e568e469Tom Gundersen/* Licensed to the Apache Software Foundation (ASF) under one or more
eac684ef1c29684b1bcd27a89c38c202e568e469Tom Gundersen * contributor license agreements. See the NOTICE file distributed with
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek * this work for additional information regarding copyright ownership.
eac684ef1c29684b1bcd27a89c38c202e568e469Tom Gundersen * The ASF licenses this file to You under the Apache License, Version 2.0
eac684ef1c29684b1bcd27a89c38c202e568e469Tom Gundersen * (the "License"); you may not use this file except in compliance with
eac684ef1c29684b1bcd27a89c38c202e568e469Tom Gundersen * the License. You may obtain a copy of the License at
eac684ef1c29684b1bcd27a89c38c202e568e469Tom Gundersen * Unless required by applicable law or agreed to in writing, software
eac684ef1c29684b1bcd27a89c38c202e568e469Tom Gundersen * distributed under the License is distributed on an "AS IS" BASIS,
eac684ef1c29684b1bcd27a89c38c202e568e469Tom Gundersen * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
eac684ef1c29684b1bcd27a89c38c202e568e469Tom Gundersen * See the License for the specific language governing permissions and
eac684ef1c29684b1bcd27a89c38c202e568e469Tom Gundersen * limitations under the License.
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek/* How often we update the stats file */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek/* TODO: Make a runtime config */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek#define HM_WATHCHDOG_NAME ("_heartmonitor_")
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekstatic const ap_slotmem_provider_t *storage = NULL;
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekstatic ap_slotmem_instance_t *slotmem = NULL;
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekmodule AP_MODULE_DECLARE_DATA heartmonitor_module;
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmektypedef struct hm_slot_server_ctx_t {
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekstatic apr_status_t hm_listen(hm_ctx_t *ctx)
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek rv = apr_socket_create(&ctx->sock, ctx->mcast_addr->family,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek SOCK_DGRAM, APR_PROTO_UDP, ctx->p);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Failed to create listening socket.");
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek rv = apr_socket_opt_set(ctx->sock, APR_SO_REUSEADDR, 1);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Failed to set APR_SO_REUSEADDR to 1 on socket.");
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek rv = apr_socket_opt_set(ctx->sock, APR_SO_NONBLOCK, 1);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Failed to set APR_SO_REUSEADDR to 1 on socket.");
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek rv = apr_socket_bind(ctx->sock, ctx->mcast_addr);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Failed to bind on socket.");
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek rv = apr_mcast_join(ctx->sock, ctx->mcast_addr, NULL, NULL);
5256e00e8b9015dd1a976d647fc71dc7efbd8cf8Tom Gundersen ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Failed to join multicast group");
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek rv = apr_mcast_loopback(ctx->sock, 1);
5256e00e8b9015dd1a976d647fc71dc7efbd8cf8Tom Gundersen ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Failed to accept localhost mulitcast on socket.");
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekstatic void qs_to_table(const char *input, apr_table_t *parms,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek key = apr_strtok(query_string, "&", &strtok_state);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek *value = '\0'; /* Split the string in two */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek value++; /* Skip past the = */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_table_set(parms, key, value);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_rerror(APLOG_MARK, APLOG_DEBUG, 0, r,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Found query arg: %s = %s", key, value);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek key = apr_strtok(NULL, "&", &strtok_state);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek/* Store in the slotmem */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekstatic apr_status_t hm_update(void* mem, void *data, apr_pool_t *p)
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek hm_slot_server_t *old = (hm_slot_server_t *) mem;
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek hm_slot_server_ctx_t *s = (hm_slot_server_ctx_t *) data;
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek if (strncmp(old->ip, new->ip, MAXIPSIZE)==0) {
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekstatic apr_status_t hm_slotmem_update_stat(hm_server_t *s, request_rec *r)
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek /* We call do_all (to try to update) otherwise grab + put */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek /* TODO: REMOVE ME BEFORE PRODUCTION (????) */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_DEBUG, 0, r->server,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: %s busy=%d ready=%d", s->ip,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek storage->doall(slotmem, hm_update, &ctx, r->pool);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek memcpy(hmserver.ip, s->ip, MAXIPSIZE);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek /* XXX locking for grab() / put() */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek storage->put(slotmem, i, (unsigned char *)&hmserver, sizeof(hmserver));
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek/* Copied from mod_lbmethod_heartbeat.c... */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekargstr_to_table(apr_pool_t *p, char *str, apr_table_t *parms)
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek key = apr_strtok(str, "&", &strtok_state);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek *value = '\0'; /* Split the string in two */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek value++; /* Skip past the = */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_table_set(parms, key, value);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_rerror(APLOG_MARK, APLOG_DEBUG, 0, r,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Found query arg: %s = %s", key, value);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek key = apr_strtok(NULL, "&", &strtok_state);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekstatic apr_status_t hm_file_update_stat(hm_ctx_t *ctx, hm_server_t *s, apr_pool_t *pool)
56fd6bf795926409b087bce406ea851ad89f9fe8Tom Gundersen unsigned int fage;
d0d6a4cd70477970812bff0a37e70f66208d7c14Tom Gundersen char *path = apr_pstrcat(pool, ctx->storage_path, ".tmp.XXXXXX", NULL);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek /* TODO: Update stats file (!) */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek rv = apr_file_mktemp(&fp, path, APR_CREATE | APR_WRITE, pool);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Unable to open tmp file: %s", path);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek rv = apr_file_open(&fpin, ctx->storage_path, APR_READ|APR_BINARY|APR_BUFFERED,
113bfde15f9393fa8bc22cbd839c0bc64e733ee2Tom Gundersen apr_bucket_alloc_t *ba = apr_bucket_alloc_create(pool);
113bfde15f9393fa8bc22cbd839c0bc64e733ee2Tom Gundersen apr_bucket_brigade *bb = apr_brigade_create(pool, ba);
113bfde15f9393fa8bc22cbd839c0bc64e733ee2Tom Gundersen apr_bucket_brigade *tmpbb = apr_brigade_create(pool, ba);
113bfde15f9393fa8bc22cbd839c0bc64e733ee2Tom Gundersen rv = apr_file_info_get(&fi, APR_FINFO_SIZE | APR_FINFO_MTIME, fpin);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Unable to read file: %s", ctx->storage_path);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek /* Read the file and update the line corresponding to the node */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ba = apr_bucket_alloc_create(pool);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek bb = apr_brigade_create(pool, ba);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_brigade_insert_file(bb, fpin, 0, fi.size, pool);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek tmpbb = apr_brigade_create(pool, ba);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek fage = (unsigned int) apr_time_sec(now - fi.mtime);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek rv = apr_brigade_split_line(tmpbb, bb,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Unable to read from file: %s", ctx->storage_path);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_brigade_flatten(tmpbb, buf, &bsize);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ip = apr_pstrndup(pool, buf, t - buf);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek /* copy things we can't process */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_file_printf(fp, "%s\n", buf);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek } else if (strcmp(ip, s->ip) !=0 ) {
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek /* Update seen time according to the last file modification */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek argstr_to_table(pool, apr_pstrdup(pool, t), hbt);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek if (apr_table_get(hbt, "busy")) {
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek node.busy = atoi(apr_table_get(hbt, "busy"));
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek if (apr_table_get(hbt, "ready")) {
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek node.ready = atoi(apr_table_get(hbt, "ready"));
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek if (apr_table_get(hbt, "lastseen")) {
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek node.seen = atoi(apr_table_get(hbt, "lastseen"));
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_file_printf(fp, "%s &ready=%u&busy=%u&lastseen=%u\n",
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ip, node.ready, node.busy, (unsigned int) seen);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek seen = apr_time_sec(now - s->seen);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_file_printf(fp, "%s &ready=%u&busy=%u&lastseen=%u\n",
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek s->ip, s->ready, s->busy, (unsigned int) seen);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek seen = apr_time_sec(now - s->seen);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_file_printf(fp, "%s &ready=%u&busy=%u&lastseen=%u\n",
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek s->ip, s->ready, s->busy, (unsigned int) seen);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Unable to flush file: %s", path);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Unable to close file: %s", path);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek APR_FPROT_UREAD | APR_FPROT_GREAD |
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek if (rv && rv != APR_INCOMPLETE) {
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Unable to set file permssions on %s",
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek rv = apr_file_rename(path, ctx->storage_path, pool);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Unable to move file: %s -> %s", path,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekstatic apr_status_t hm_update_stat(hm_ctx_t *ctx, hm_server_t *s, request_rec *r)
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek return hm_slotmem_update_stat(s, r);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek return hm_file_update_stat(ctx, s, r->pool);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek/* Store in a file */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekstatic apr_status_t hm_file_update_stats(hm_ctx_t *ctx, apr_pool_t *p)
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek char *path = apr_pstrcat(p, ctx->storage_path, ".tmp.XXXXXX", NULL);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek /* TODO: Update stats file (!) */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek rv = apr_file_mktemp(&fp, path, APR_CREATE | APR_WRITE, p);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Unable to open tmp file: %s", path);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek for (hi = apr_hash_first(p, ctx->servers);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek hi != NULL; hi = apr_hash_next(hi)) {
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_hash_this(hi, NULL, NULL, (void **) &s);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek seen = apr_time_sec(now - s->seen);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek * Skip this entry from the heartbeat file -- when it comes back,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek * we will reuse the memory...
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_file_printf(fp, "%s &ready=%u&busy=%u&lastseen=%u\n",
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek s->ip, s->ready, s->busy, (unsigned int) seen);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Unable to flush file: %s", path);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Unable to close file: %s", path);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek APR_FPROT_UREAD | APR_FPROT_GREAD |
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek if (rv && rv != APR_INCOMPLETE) {
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Unable to set file permssions on %s",
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek rv = apr_file_rename(path, ctx->storage_path, p);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Unable to move file: %s -> %s", path,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekstatic hm_server_t *hm_get_server(hm_ctx_t *ctx, const char *ip)
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek s = apr_hash_get(ctx->servers, ip, APR_HASH_KEY_STRING);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek s = apr_palloc(ctx->p, sizeof(hm_server_t));
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek s->ip = apr_pstrdup(ctx->p, ip);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_hash_set(ctx->servers, s->ip, APR_HASH_KEY_STRING, s);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek/* Process a message received from a backend node */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekstatic void hm_processmsg(hm_ctx_t *ctx, apr_pool_t *p,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_sockaddr_t *from, char *buf, int len)
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek if (apr_table_get(tbl, "v") != NULL &&
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_table_get(tbl, "busy") != NULL &&
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_table_get(tbl, "ready") != NULL) {
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek /* TODO: REMOVE ME BEFORE PRODUCTION (????) */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_DEBUG, 0, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: %pI busy=%s ready=%s", from,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_table_get(tbl, "busy"), apr_table_get(tbl, "ready"));
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek s->busy = atoi(apr_table_get(tbl, "busy"));
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek s->ready = atoi(apr_table_get(tbl, "ready"));
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, 0, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: malformed message from %pI",
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek/* Read message from multicast socket */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekstatic apr_status_t hm_recv(hm_ctx_t *ctx, apr_pool_t *p)
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek rv = apr_socket_recvfrom(&from, ctx->sock, 0, buf, &len);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: would block");
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: recvfrom failed");
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek hm_processmsg(ctx, p, &from, buf, len);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekstatic apr_status_t hm_watchdog_callback(int state, void *data,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek hm_ctx_t *ctx = (hm_ctx_t *)data;
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek case AP_WATCHDOG_STATE_STARTING:
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Unable to listen for connections!");
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_DEBUG, 0, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: %s listener started.",
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek /* XXX slotmem: if used by the handler, this looks like a bad idea (we are not the one receiving the information) */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek hm_file_update_stats(ctx, pool);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek cur = now = apr_time_sec(apr_time_now());
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek /* TODO: Instead of HN_UPDATE_SEC, use
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek * the ctx->interval
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek while ((now - cur) < apr_time_sec(ctx->interval)) {
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek pfd.desc_type = APR_POLL_SOCKET;
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek rc = apr_poll(&pfd, 1, &n, timeout);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek if (rc == APR_SUCCESS && (pfd.rtnevents & APR_POLLIN)) {
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek now = apr_time_sec(apr_time_now());
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek case AP_WATCHDOG_STATE_STOPPING:
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_DEBUG, 0, ctx->s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: stopping %s listener.",
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekstatic int hm_post_config(apr_pool_t *p, apr_pool_t *plog,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_pool_t *ptemp, server_rec *s)
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek const char *userdata_key = "mod_heartmonitor_init";
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek hm_ctx_t *ctx = ap_get_module_config(s->module_config,
eac684ef1c29684b1bcd27a89c38c202e568e469Tom Gundersen /* Create the slotmem */
eac684ef1c29684b1bcd27a89c38c202e568e469Tom Gundersen apr_pool_userdata_get(&data, userdata_key, s->process->pool);
eac684ef1c29684b1bcd27a89c38c202e568e469Tom Gundersen /* first call do nothing */
eac684ef1c29684b1bcd27a89c38c202e568e469Tom Gundersen apr_pool_userdata_set((const void *)1, userdata_key, apr_pool_cleanup_null, s->process->pool);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek storage = ap_lookup_provider(AP_SLOTMEM_PROVIDER_GROUP, "shared", "0");
eac684ef1c29684b1bcd27a89c38c202e568e469Tom Gundersen ap_log_error(APLOG_MARK, APLOG_NOERRNO|APLOG_EMERG, 0, s, "ap_lookup_provider %s failed", AP_SLOTMEM_PROVIDER_GROUP);
eac684ef1c29684b1bcd27a89c38c202e568e469Tom Gundersen storage->create(&slotmem, "mod_heartmonitor", sizeof(hm_slot_server_t), maxworkers, AP_SLOTMEM_TYPE_PREGRAB, p);
b85595b511d3d9f67940f7de0265fb78d672fe81Hong Shick Pak ap_log_error(APLOG_MARK, APLOG_NOERRNO|APLOG_EMERG, 0, s, "slotmem_create for status failed");
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, s,
f47c5c47d1a7bcfa1842ff7cc52b1f7fc1d86bcfpoma "Heartmonitor: Failed to create watchdog "
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "instance (%s)", HM_WATHCHDOG_NAME);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek /* Register a callback with zero interval. */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_log_error(APLOG_MARK, APLOG_CRIT, rv, s,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek "Heartmonitor: Failed to register watchdog "
0a8a0fad010018be0f46d1c2e077ade0eb27c7dbTom Gundersen "Heartmonitor: wd callback %s", HM_WATHCHDOG_NAME);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmekstatic int hm_handler(request_rec *r)
0a8a0fad010018be0f46d1c2e077ade0eb27c7dbTom Gundersen hm_ctx_t *ctx = ap_get_module_config(r->server->module_config,
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek buf = apr_pcalloc(r->pool, MAX_MSG_LEN);
0a8a0fad010018be0f46d1c2e077ade0eb27c7dbTom Gundersen input_brigade = apr_brigade_create(r->connection->pool, r->connection->bucket_alloc);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek status = ap_get_brigade(r->input_filters, input_brigade, AP_MODE_READBYTES, APR_BLOCK_READ, MAX_MSG_LEN);
0a8a0fad010018be0f46d1c2e077ade0eb27c7dbTom Gundersen apr_brigade_flatten(input_brigade, buf, &len);
0a8a0fad010018be0f46d1c2e077ade0eb27c7dbTom Gundersen /* we can't use hm_processmsg because it uses hm_get_server() */
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek tbl = apr_table_make(r->pool, 10);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek apr_sockaddr_ip_get(&ip, r->connection->remote_addr);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek hmserver.busy = atoi(apr_table_get(tbl, "busy"));
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek hmserver.ready = atoi(apr_table_get(tbl, "ready"));
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek hm_update_stat(ctx, &hmserver, r);
798d3a524ea57aaf40cb53858aaa45ec702f012dZbigniew Jędrzejewski-Szmek ap_set_content_type(r, "text/plain");
return OK;
ctx->s = s;
return ctx;
return err;
return NULL;
char *host_str;
char *scope_id;
return err;
if (rv) {
if (port == 0) {
if (rv) {
return NULL;
return err;
return NULL;
{NULL}