diff options
Diffstat (limited to 'src/or/geoip.c')
-rw-r--r-- | src/or/geoip.c | 215 |
1 files changed, 215 insertions, 0 deletions
diff --git a/src/or/geoip.c b/src/or/geoip.c index 14b5f66263..a7e46c0b8f 100644 --- a/src/or/geoip.c +++ b/src/or/geoip.c @@ -570,6 +570,204 @@ _c_hist_compare(const void **_a, const void **_b) return strcmp(a->country, b->country); } +/** When there are incomplete directory requests at the end of a 24-hour + * period, consider those requests running for longer than this timeout as + * failed, the others as still running. */ +#define DIRREQ_TIMEOUT (10*60) + +/** Entry in a map from either conn->global_identifier for direct requests + * or a unique circuit identifier for tunneled requests to request time, + * response size, and completion time of a network status request. Used to + * measure download times of requests to derive average client + * bandwidths. */ +typedef struct dirreqdlmap_entry_t { + directory_request_state_t state; /**< State of this directory request. */ + /** Unique identifier for this network status request; this is either the + * conn->global_identifier of the dir conn (direct request) or a new + * locally unique identifier of a circuit (tunneled request). This ID is + * only unique among other direct or tunneled requests, respectively. */ + uint64_t request_id; + /** Is this a direct or a tunneled request? */ + directory_request_type_t type; + int completed:1; /**< Is this request complete? */ + geoip_client_action_t action; /**< Is this a v2 or v3 request? */ + /** When did we receive the request and started sending the response? */ + struct timeval request_time; + size_t response_size; /**< What is the size of the response in bytes? */ + struct timeval completion_time; /**< When did the request succeed? */ +} dirreqdlmap_entry_t; + +/** Map of all directory requests asking for v2 or v3 network statuses in + * the current geoip-stats interval. Keys are strings starting with either + * "dir" for direct requests or "tun" for tunneled requests, followed by + * a unique uint64_t identifier represented as decimal string. Values are + * of type *<b>dirreqdlmap_entry_t</b>. */ +static strmap_t *dirreqdlmap = NULL; + +/** Helper: Put <b>entry</b> into map of directory requests using + * <b>tunneled</b> and <b>request_id</b> as key parts. If there is + * already an entry for that key, print out a BUG warning and return. */ +static void +_dirreqdlmap_put(dirreqdlmap_entry_t *entry, + directory_request_type_t type, uint64_t request_id) +{ + char key[3+20+1]; /* dir|tun + -9223372036854775808 + \0 */ + dirreqdlmap_entry_t *ent; + if (!dirreqdlmap) + dirreqdlmap = strmap_new(); + tor_snprintf(key, sizeof(key), "%s"U64_FORMAT, + type == REQUEST_TUNNELED ? "tun" : "dir", + U64_PRINTF_ARG(request_id)); + ent = strmap_get(dirreqdlmap, key); + if (ent) { + log_warn(LD_BUG, "Error when putting directory request into local " + "map. There is already an entry for the same identifier."); + return; + } + strmap_set(dirreqdlmap, key, entry); +} + +/** Helper: Look up and return an entry in the map of directory requests + * using <b>tunneled</b> and <b>request_id</b> as key parts. If there + * is no such entry, return NULL. */ +static dirreqdlmap_entry_t * +_dirreqdlmap_get(directory_request_type_t type, uint64_t request_id) +{ + char key[3+20+1]; /* dir|tun + -9223372036854775808 + \0 */ + if (!dirreqdlmap) + dirreqdlmap = strmap_new(); + tor_snprintf(key, sizeof(key), "%s"U64_FORMAT, + type == REQUEST_TUNNELED ? "tun" : "dir", + U64_PRINTF_ARG(request_id)); + return strmap_get(dirreqdlmap, key); +} + +/** Note that an either direct or tunneled (see <b>type</b>) directory + * request for a network status with unique ID <b>request_id</b> of size + * <b>response_size</b> and action <b>action</b> (either v2 or v3) has + * started. */ +void +geoip_start_dirreq(uint64_t request_id, size_t response_size, + geoip_client_action_t action, + directory_request_type_t type) +{ + dirreqdlmap_entry_t *ent = tor_malloc_zero(sizeof(dirreqdlmap_entry_t)); + ent->request_id = request_id; + tor_gettimeofday(&ent->request_time); + ent->response_size = response_size; + ent->action = action; + ent->type = type; + _dirreqdlmap_put(ent, type, request_id); +} + +/** Change the state of the either direct or tunneled (see <b>type</b>) + * directory request with <b>request_id</b> to <b>new_state</b> and + * possibly mark it as completed. If no entry can be found for the given + * key parts (e.g., if this is a directory request that we are not + * measuring, or one that was started in the previous measurement period), + * or if the state cannot be advanced to <b>new_state</b>, do nothing. */ +void +geoip_change_dirreq_state(uint64_t request_id, + directory_request_type_t type, + directory_request_state_t new_state) +{ + dirreqdlmap_entry_t *ent = _dirreqdlmap_get(type, request_id); + if (!ent) + return; + if (new_state == REQUEST_IS_FOR_NETWORK_STATUS) + return; + if (new_state - 1 != ent->state) + return; + ent->state = new_state; + if ((type == REQUEST_DIRECT && new_state == FLUSHING_DIR_CONN_FINISHED) || + (type == REQUEST_TUNNELED && new_state == OR_CONN_BUFFER_FLUSHED)) { + tor_gettimeofday(&ent->completion_time); + ent->completed = 1; + } +} + +#ifdef ENABLE_GEOIP_STATS +/** Return a newly allocated comma-separated string containing statistics + * on network status downloads. The string contains the number of completed + * requests, timeouts, and still running requests as well as the download + * times by deciles and quartiles. Return NULL if we have not observed + * requests for long enough. */ +static char * +geoip_get_dirreqdl_history(geoip_client_action_t action, + directory_request_type_t type) +{ + char *result = NULL; + smartlist_t *dirreqdl_times = NULL; + uint32_t complete = 0, timeouts = 0, running = 0; + int i = 0, bufsize = 1024, written; + struct timeval now; + tor_gettimeofday(&now); + if (!dirreqdlmap) + return NULL; + if (action != GEOIP_CLIENT_NETWORKSTATUS && + action != GEOIP_CLIENT_NETWORKSTATUS_V2) + return NULL; + dirreqdl_times = smartlist_create(); + STRMAP_FOREACH_MODIFY(dirreqdlmap, key, dirreqdlmap_entry_t *, ent) { + if (ent->action == action && type == ent->type) { + if (ent->completed) { + uint32_t *bytes_per_second = tor_malloc_zero(sizeof(uint32_t)); + uint32_t time_diff = (uint32_t) tv_udiff(&ent->request_time, + &ent->completion_time); + if (time_diff == 0) + time_diff = 1; /* Avoid DIV/0; "instant" answers are impossible + * anyway by law of nature or something.. */ + *bytes_per_second = 1000000 * ent->response_size / time_diff; + smartlist_add(dirreqdl_times, bytes_per_second); + complete++; + } else { + if (tv_udiff(&ent->request_time, &now) / 1000000 > DIRREQ_TIMEOUT) + timeouts++; + else + running++; + } + tor_free(ent); + MAP_DEL_CURRENT(key); + } + } STRMAP_FOREACH_END; + result = tor_malloc_zero(bufsize); + written = tor_snprintf(result, bufsize, "complete=%d,timeout=%d," + "running=%d", complete, timeouts, running); + if (written < 0) + return NULL; +#define MIN_DIR_REQ_RESPONSES 16 + if (complete >= MIN_DIR_REQ_RESPONSES) { + uint32_t *dltimes = tor_malloc(sizeof(uint32_t) * complete); + SMARTLIST_FOREACH(dirreqdl_times, uint32_t *, dlt, { + dltimes[i++] = *dlt; + tor_free(dlt); + }); + median_uint32(dltimes, complete); /* sort */ + written = tor_snprintf(result + written, bufsize - written, + ",min=%d,d1=%d,d2=%d,q1=%d,d3=%d,d4=%d,md=%d," + "d6=%d,d7=%d,q3=%d,d8=%d,d9=%d,max=%d", + dltimes[0], + dltimes[1*complete/10-1], + dltimes[2*complete/10-1], + dltimes[1*complete/4-1], + dltimes[3*complete/10-1], + dltimes[4*complete/10-1], + dltimes[5*complete/10-1], + dltimes[6*complete/10-1], + dltimes[7*complete/10-1], + dltimes[3*complete/4-1], + dltimes[8*complete/10-1], + dltimes[9*complete/10-1], + dltimes[complete-1]); + tor_free(dltimes); + } + if (written < 0) + result = NULL; + smartlist_free(dirreqdl_times); + return result; +} +#endif + /** How long do we have to have observed per-country request history before we * are willing to talk about it? */ #define GEOIP_MIN_OBSERVATION_TIME (12*60*60) @@ -785,6 +983,23 @@ dump_geoip_stats(void) goto done; } + data_v2 = geoip_get_dirreqdl_history(GEOIP_CLIENT_NETWORKSTATUS_V2, + REQUEST_DIRECT); + data_v3 = geoip_get_dirreqdl_history(GEOIP_CLIENT_NETWORKSTATUS, + REQUEST_DIRECT); + if (fprintf(out, "ns-direct-dl %s\nns-v2-direct-dl %s\n", + data_v3 ? data_v3 : "", data_v2 ? data_v2 : "") < 0) + goto done; + tor_free(data_v2); + tor_free(data_v3); + data_v2 = geoip_get_dirreqdl_history(GEOIP_CLIENT_NETWORKSTATUS_V2, + REQUEST_TUNNELED); + data_v3 = geoip_get_dirreqdl_history(GEOIP_CLIENT_NETWORKSTATUS, + REQUEST_TUNNELED); + if (fprintf(out, "ns-tunneled-dl %s\nns-v2-tunneled-dl %s\n", + data_v3 ? data_v3 : "", data_v2 ? data_v2 : "") < 0) + goto done; + finish_writing_to_file(open_file); open_file = NULL; done: |