/* $Header: /cvs/src/chrony/sources.c,v 1.33 2003/09/22 21:22:30 richard Exp $ ======================================================================= chronyd/chronyc - Programs for keeping computer clocks accurate. ********************************************************************** * Copyright (C) Richard P. Curnow 1997-2003 * * This program is free software; you can redistribute it and/or modify * it under the terms of version 2 of the GNU General Public License as * published by the Free Software Foundation. * * This program is distributed in the hope that it will be useful, but * WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU * General Public License for more details. * * You should have received a copy of the GNU General Public License along * with this program; if not, write to the Free Software Foundation, Inc., * 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA * ********************************************************************** ======================================================================= The routines in this file manage the complete pool of sources that we might be synchronizing to. This includes NTP sources and others (e.g. local reference clocks, eyeball + wristwatch etc). */ #include "sysincl.h" #include "sources.h" #include "sourcestats.h" #include "memory.h" #include "ntp.h" /* For NTP_Leap */ #include "local.h" #include "reference.h" #include "util.h" #include "conf.h" #include "logging.h" #include "reports.h" #include "nameserv.h" #include "mkdirpp.h" /* ================================================== */ /* Flag indicating that we are initialised */ static int initialised = 0; /* ================================================== */ /* Structure used to hold info for selecting between sources */ struct SelectInfo { int stratum; int select_ok; double variance; double root_delay; double root_dispersion; double root_distance; double best_offset; double lo_limit; double hi_limit; }; /* ================================================== */ /* This enum contains the flag values that are used to label each source */ typedef enum { SRC_OK, /* OK so far */ SRC_UNREACHABLE, /* Source is not reachable */ SRC_BAD_STATS, /* Stats driver could not supply valid data */ SRC_FALSETICKER, /* Source is found to be a falseticker */ SRC_JITTERY, /* Source scatter worse than other's dispersion */ SRC_SELECTABLE, /* Source is acceptable candidate */ SRC_SYNC /* Current synchronisation source */ } SRC_Status; /* ================================================== */ /* Define the instance structure used to hold information about each source */ struct SRC_Instance_Record { SST_Stats stats; NTP_Leap leap_status; /* Leap status */ int index; /* Index back into the array of source */ unsigned long ref_id; /* The reference ID of this source (i.e. its IP address, NOT the reference _it_ is sync'd to) */ /* Flag indicating that we are receiving packets with valid headers from this source and can use it as a reference */ int reachable; /* Flag indicating the status of the source */ SRC_Status status; struct SelectInfo sel_info; }; /* ================================================== */ /* Structure used to build the sort list for finding falsetickers */ struct Sort_Element { int index; double offset; enum {LOW=-1, CENTRE=0, HIGH=1} tag; }; /* ================================================== */ /* Table of sources */ static struct SRC_Instance_Record **sources; static struct Sort_Element *sort_list; static int *sel_sources; static int n_sources; /* Number of sources currently in the table */ static int max_n_sources; /* Capacity of the table */ #define INVALID_SOURCE (-1) static int selected_source_index; /* Which source index is currently selected (set to INVALID_SOURCE if no current valid reference) */ /* ================================================== */ /* Forward prototype */ static void slew_sources(struct timeval *raw, struct timeval *cooked, double dfreq, double afreq, double doffset, int is_step_change, void *anything); /* ================================================== */ /* Initialisation function */ void SRC_Initialise(void) { sources = NULL; sort_list = NULL; n_sources = 0; max_n_sources = 0; selected_source_index = INVALID_SOURCE; initialised = 1; LCL_AddParameterChangeHandler(slew_sources, NULL); return; } /* ================================================== */ /* Finalisation function */ void SRC_Finalise(void) { LCL_RemoveParameterChangeHandler(slew_sources, NULL); initialised = 0; return; } /* ================================================== */ /* Function to create a new instance. This would be called by one of the individual source-type instance creation routines. */ SRC_Instance SRC_CreateNewInstance(unsigned long ref_id) { SRC_Instance result; if (!initialised) { CROAK("Should be initialised"); } result = MallocNew(struct SRC_Instance_Record); result->stats = SST_CreateInstance(ref_id); if (n_sources == max_n_sources) { /* Reallocate memory */ max_n_sources += 32; if (sources) { sources = ReallocArray(struct SRC_Instance_Record *, max_n_sources, sources); sort_list = ReallocArray(struct Sort_Element, 3*max_n_sources, sort_list); sel_sources = ReallocArray(int, max_n_sources, sel_sources); } else { sources = MallocArray(struct SRC_Instance_Record *, max_n_sources); sort_list = MallocArray(struct Sort_Element, 3*max_n_sources); sel_sources = MallocArray(int, max_n_sources); } } sources[n_sources] = result; result->index = n_sources; result->leap_status = LEAP_Normal; result->ref_id = ref_id; result->reachable = 0; result->status = SRC_BAD_STATS; n_sources++; return result; } /* ================================================== */ /* Function to get rid of a source when it is being unconfigured. This may cause the current reference source to be reselected, if this was the reference source or contributed significantly to a falseticker decision. */ void SRC_DestroyInstance(SRC_Instance instance) { int dead_index, i; if (!initialised) { CROAK("Should be initialised"); } if (instance->index == selected_source_index) { instance->reachable = 0; SRC_SelectSource(0); } SST_DeleteInstance(instance->stats); dead_index = instance->index; for (i=dead_index; iindex = i; } --n_sources; Free(instance); if (selected_source_index > dead_index) { --selected_source_index; } } /* ================================================== */ /* Function to get the range of frequencies, relative to the given source, that we believe the local clock lies within. The return values are in terms of the number of seconds fast (+ve) or slow (-ve) relative to the source that the local clock becomes after a given amount of local time has elapsed. Suppose the initial offset relative to the source is U (fast +ve, slow -ve) and a time interval T elapses measured in terms of the local clock. Then the error relative to the source at the end of the interval should lie in the interval [U+T*lo, U+T*hi]. */ void SRC_GetFrequencyRange(SRC_Instance instance, double *lo, double *hi) { if (!initialised) { CROAK("Should be initialised"); } SST_GetFrequencyRange(instance->stats, lo, hi); return; } /* ================================================== */ /* This function is called by one of the source drivers when it has a new sample that is to be accumulated. This function causes the frequency estimation to be re-run for the designated source, and the clock selection procedure to be re-run afterwards. Parameters are described in sources.h */ void SRC_AccumulateSample (SRC_Instance inst, struct timeval *sample_time, double offset, double peer_delay, double peer_dispersion, double root_delay, double root_dispersion, int stratum, NTP_Leap leap_status) { if (!initialised) { CROAK("Should be initialised"); } inst->leap_status = leap_status; #ifdef TRACEON LOG(LOGS_INFO, LOGF_Sources, "ip=[%s] t=%s ofs=%f del=%f disp=%f str=%d", UTI_IPToDottedQuad(inst->ref_id), UTI_TimevalToString(sample_time), -offset, root_delay, root_dispersion, stratum); #endif /* WE HAVE TO NEGATE OFFSET IN THIS CALL, IT IS HERE THAT THE SENSE OF OFFSET IS FLIPPED */ SST_AccumulateSample(inst->stats, sample_time, -offset, peer_delay, peer_dispersion, root_delay, root_dispersion, stratum); SST_DoNewRegression(inst->stats); /* And redo clock selection */ SRC_SelectSource(inst->ref_id); return; } /* ================================================== */ void SRC_SetReachable(SRC_Instance inst) { inst->reachable = 1; #ifdef TRACEON LOG(LOGS_INFO, LOGF_Sources, "%s", UTI_IPToDottedQuad(inst->ref_id)); #endif /* Don't do selection at this point, though - that will come about in due course when we get some useful data from the source */ } /* ================================================== */ void SRC_UnsetReachable(SRC_Instance inst) { inst->reachable = 0; #ifdef TRACEON LOG(LOGS_INFO, LOGF_Sources, "%s%s", UTI_IPToDottedQuad(inst->ref_id), (inst->index == selected_source_index) ? "(REF)":""); #endif /* If this was the previous reference source, we have to reselect! */ if (inst->index == selected_source_index) { SRC_SelectSource(0); } } /* ================================================== */ static int compare_sort_elements(const void *a, const void *b) { const struct Sort_Element *u = (const struct Sort_Element *) a; const struct Sort_Element *v = (const struct Sort_Element *) b; if (u->offset < v->offset) { return -1; } else if (u->offset > v->offset) { return +1; } else if (u->tag < v->tag) { return -1; } else if (u->tag > v->tag) { return +1; } else { return 0; } } /* ================================================== */ /* This function selects the current reference from amongst the pool of sources we are holding. Updates are only made to the local reference if match_addr is zero or is equal to the selected reference source address */ void SRC_SelectSource(unsigned long match_addr) { int i, j, index; struct timeval now; double local_clock_err; int src_select_ok; double src_offset, src_offset_sd, src_frequency, src_skew; double src_accrued_dispersion; int n_endpoints, j1, j2; double best_lo, best_hi; int depth, best_depth; int n_sel_sources; double distance, min_distance; int stratum, min_stratum; int min_distance_index; struct SelectInfo *si; double total_root_dispersion; int n_reachable_sources; NTP_Leap leap_status = LEAP_Normal; if (n_sources == 0) { /* In this case, we clearly cannot synchronise to anything */ if (selected_source_index != INVALID_SOURCE) { LOG(LOGS_INFO, LOGF_Sources, "Can't synchronise: no sources"); } selected_source_index = INVALID_SOURCE; REF_SetUnsynchronised(); return; } LCL_ReadCookedTime(&now, &local_clock_err); /* Step 1 - build intervals about each source */ n_endpoints = 0; n_reachable_sources = 0; for (i=0; ireachable) { ++n_reachable_sources; si = &(sources[i]->sel_info); SST_GetSelectionData(sources[i]->stats, &now, &(si->stratum), &(si->best_offset), &(si->root_delay), &(si->root_dispersion), &(si->variance), &(si->select_ok)); /* Eventually this might be a flag indicating whether the get selection data call was successful. For now it always is. */ src_select_ok = 1; si->root_distance = si->root_dispersion + 0.5 * fabs(si->root_delay); si->lo_limit = si->best_offset - si->root_distance; si->hi_limit = si->best_offset + si->root_distance; #if 0 LOG(LOGS_INFO, LOGF_Sources, "%s off=%f dist=%f lo=%f hi=%f", UTI_IPToDottedQuad(sources[i]->ref_id), si->best_offset, si->root_distance, si->lo_limit, si->hi_limit); #endif if (src_select_ok) { sources[i]->status = SRC_OK; /* For now */ /* Otherwise it will be hard to pick this one later! However, this test might be too strict, we might want to dump it */ j1 = n_endpoints; j2 = j1 + 1; sort_list[j1].index = i; sort_list[j1].offset = si->lo_limit; sort_list[j1].tag = LOW; sort_list[j2].index = i; sort_list[j2].offset = si->hi_limit; sort_list[j2].tag = HIGH; n_endpoints += 2; } else { sources[i]->status = SRC_BAD_STATS; } } else { /* If the source is not reachable, there is no way we will pick it. */ sources[i]->status = SRC_UNREACHABLE; } } #if 0 LOG(LOGS_INFO, LOGF_Sources, "n_endpoints=%d", n_endpoints); #endif /* Now sort the endpoint list */ if (n_endpoints > 0) { /* Sort the list into order */ qsort((void *) sort_list, n_endpoints, sizeof(struct Sort_Element), compare_sort_elements); /* Now search for the interval which is contained in the most individual source intervals. Any source which overlaps this will be a candidate. If we get a case like <-----------------------> <--> <--> <===========> we will build the interval as shown with '=', whereas with an extra source we get <-----------------------> <-------> <--> <--> <==> The first case is just bad luck - we need extra sources to detect the falseticker, so just make an arbitrary choice based on stratum & stability etc. */ depth = best_depth = 0; best_lo = best_hi = 0.0; for (i=0; iref_id)); #endif switch(sort_list[i].tag) { case LOW: depth++; if (depth > best_depth) { best_depth = depth; best_lo = sort_list[i].offset; } break; case CENTRE: CROAK("CENTRE cannot occur"); break; case HIGH: if (depth == best_depth) { best_hi = sort_list[i].offset; } depth--; break; } } #if 0 LOG(LOGS_INFO, LOGF_Sources, "best_depth=%d best_lo=%f best_hi=%f", best_depth, best_lo, best_hi); #endif if (best_depth <= n_reachable_sources/2) { /* Could not even get half the reachable sources to agree - clearly we can't synchronise. srcs #to agree 1 1 2 2 3 2 4 3 etc */ if (selected_source_index != INVALID_SOURCE) { LOG(LOGS_INFO, LOGF_Sources, "Can't synchronise: no majority"); } selected_source_index = INVALID_SOURCE; REF_SetUnsynchronised(); /* .. and mark all sources as falsetickers (so they appear thus on the outputs from the command client) */ for (i=0; istatus = SRC_FALSETICKER; } } else { /* We have our interval, now work out which source are in it, i.e. build list of admissible sources. */ n_sel_sources = 0; for (i=0; istatus == SRC_OK) { /* This should be the same condition to get into the endpoint list */ /* Check if source's interval contains the best interval, or is wholly contained within it */ if (((sources[i]->sel_info.lo_limit <= best_lo) && (sources[i]->sel_info.hi_limit >= best_hi)) || ((sources[i]->sel_info.lo_limit >= best_lo) && (sources[i]->sel_info.hi_limit <= best_hi))) { sel_sources[n_sel_sources++] = i; #if 0 LOG(LOGS_INFO, LOGF_Sources, "i=%d addr=%s is valid", i, UTI_IPToDottedQuad(sources[i]->ref_id)); #endif } else { sources[i]->status = SRC_FALSETICKER; #if 0 LOG(LOGS_INFO, LOGF_Sources, "i=%d addr=%s is a falseticker", i, UTI_IPToDottedQuad(sources[i]->ref_id)); #endif } } } /* We now have a list of indices for the sources which pass the false-ticker test. Now go on to reject those whose variance is greater than the minimum distance of any other */ /* Find minimum distance */ index = sel_sources[0]; min_distance = sources[index]->sel_info.root_distance; for (i=1; isel_info.root_distance; if (distance < min_distance) { min_distance = distance; } } #if 0 LOG(LOGS_INFO, LOGF_Sources, "min_distance=%f", min_distance); #endif /* Now go through and prune any sources that have excessive variance */ for (i=0; isel_info.variance > min_distance) { sel_sources[i] = INVALID_SOURCE; sources[index]->status = SRC_JITTERY; #if 0 LOG(LOGS_INFO, LOGF_Sources, "i=%d addr=%s has too much variance", i, UTI_IPToDottedQuad(sources[i]->ref_id)); #endif } } /* Now crunch the list and mark all sources as selectable */ for (i=j=0; istatus = SRC_SELECTABLE; sel_sources[j++] = sel_sources[i]; index++; } } n_sel_sources = j; /* Now find minimum stratum. If none are left now, tough. RFC1305 is not so harsh on pruning sources due to excess variance, which prevents this from happening */ if (n_sel_sources > 0) { index = sel_sources[0]; min_stratum = sources[index]->sel_info.stratum; for (i=1; isel_info.stratum; if (stratum < min_stratum) min_stratum = stratum; } #if 0 LOG(LOGS_INFO, LOGF_Sources, "min_stratum=%d", min_stratum); #endif /* Does the current source have this stratum and is it still a survivor? */ if ((selected_source_index == INVALID_SOURCE) || (sources[selected_source_index]->status != SRC_SELECTABLE) || (sources[selected_source_index]->sel_info.stratum > min_stratum)) { /* We have to elect a new synchronisation source */ min_distance_index = INVALID_SOURCE; for (i=0; isel_info.stratum == min_stratum) { if ((min_distance_index == INVALID_SOURCE) || (sources[index]->sel_info.root_distance < min_distance)) { min_distance = sources[index]->sel_info.root_distance; min_distance_index = index; } } } selected_source_index = min_distance_index; LOG(LOGS_INFO, LOGF_Sources, "Selected source %s", UTI_IPToDottedQuad(sources[selected_source_index]->ref_id)); #if 0 LOG(LOGS_INFO, LOGF_Sources, "new_sel_index=%d", min_distance_index); #endif } else { /* We retain the existing sync source, see p40 of RFC1305b.ps */ #if 0 LOG(LOGS_INFO, LOGF_Sources, "existing reference retained", min_distance_index); #endif } sources[selected_source_index]->status = SRC_SYNC; /* Now just use the statistics of the selected source for trimming the local clock */ LCL_ReadCookedTime(&now, &local_clock_err); SST_GetTrackingData(sources[selected_source_index]->stats, &now, &src_offset, &src_offset_sd, &src_accrued_dispersion, &src_frequency, &src_skew); total_root_dispersion = (src_accrued_dispersion + sources[selected_source_index]->sel_info.root_dispersion); if ((match_addr == 0) || (match_addr == sources[selected_source_index]->ref_id)) { REF_SetReference(min_stratum, leap_status, sources[selected_source_index]->ref_id, &now, src_offset, src_frequency, src_skew, sources[selected_source_index]->sel_info.root_delay, total_root_dispersion); } } else { if (selected_source_index != INVALID_SOURCE) { LOG(LOGS_INFO, LOGF_Sources, "Can't synchronise: no selectable sources"); } selected_source_index = INVALID_SOURCE; REF_SetUnsynchronised(); } } } else { /* No sources provided valid endpoints */ if (selected_source_index != INVALID_SOURCE) { LOG(LOGS_INFO, LOGF_Sources, "Can't synchronise: no reachable sources"); } selected_source_index = INVALID_SOURCE; REF_SetUnsynchronised(); } } /* ================================================== */ double SRC_PredictOffset(SRC_Instance inst, struct timeval *when) { return SST_PredictOffset(inst->stats, when); } /* ================================================== */ double SRC_MinRoundTripDelay(SRC_Instance inst) { return SST_MinRoundTripDelay(inst->stats); } /* ================================================== */ /* This routine is registered as a callback with the local clock module, to be called whenever the local clock changes frequency or is slewed. It runs through all the existing source statistics, and adjusts them to make them look as though they were sampled under the new regime. */ static void slew_sources(struct timeval *raw, struct timeval *cooked, double dfreq, double afreq, double doffset, int is_step_change, void *anything) { int i; for (i=0; istats, cooked, dfreq, doffset); } } /* ================================================== */ /* This is called to dump out the source measurement registers */ void SRC_DumpSources(void) { FILE *out; int direc_len, file_len; char *filename; unsigned int a, b, c, d; int i; char *direc; direc = CNF_GetDumpDir(); direc_len = strlen(direc); file_len = direc_len + 24; filename = MallocArray(char, file_len); /* a bit of slack */ if (mkdir_and_parents(direc)) { for (i=0; iref_id) >> 24; b = ((sources[i]->ref_id) >> 16) & 0xff; c = ((sources[i]->ref_id) >> 8) & 0xff; d = ((sources[i]->ref_id)) & 0xff; snprintf(filename, file_len-1, "%s/%d.%d.%d.%d.dat", direc, a, b, c, d); out = fopen(filename, "w"); if (!out) { LOG(LOGS_WARN, LOGF_Sources, "Could not open dump file %s", filename); } else { SST_SaveToFile(sources[i]->stats, out); fclose(out); } } } else { LOG(LOGS_ERR, LOGF_Sources, "Could not create directory %s", direc); } Free(filename); } /* ================================================== */ void SRC_ReloadSources(void) { FILE *in; char *filename; unsigned int a, b, c, d; int i; char *dumpdir; int dumpdirlen, filelen; for (i=0; iref_id) >> 24; b = ((sources[i]->ref_id) >> 16) & 0xff; c = ((sources[i]->ref_id) >> 8) & 0xff; d = ((sources[i]->ref_id)) & 0xff; dumpdir = CNF_GetDumpDir(); dumpdirlen = strlen(dumpdir); filelen = dumpdirlen + 24; filename = MallocArray(char, filelen); snprintf(filename, filelen-1, "%s/%d.%d.%d.%d.dat", dumpdir, a, b, c, d); in = fopen(filename, "r"); if (!in) { LOG(LOGS_WARN, LOGF_Sources, "Could not open dump file %s", filename); } else { if (SST_LoadFromFile(sources[i]->stats, in)) { /* We might want to use SST_DoUpdateRegression here, but we need to check it has the same functionality */ SST_DoNewRegression(sources[i]->stats); } else { LOG(LOGS_WARN, LOGF_Sources, "Problem loading from file %s", filename); } fclose(in); } Free(filename); } } /* ================================================== */ int SRC_IsSyncPeer(SRC_Instance inst) { if (inst->index == selected_source_index) { return 1; } else { return 0; } } /* ================================================== */ int SRC_ReadNumberOfSources(void) { return n_sources; } /* ================================================== */ int SRC_ReportSource(int index, RPT_SourceReport *report, struct timeval *now) { SRC_Instance src; if ((index >= n_sources) || (index < 0)) { return 0; } else { src = sources[index]; report->ip_addr = src->ref_id; switch (src->status) { case SRC_SYNC: report->state = RPT_SYNC; break; case SRC_JITTERY: report->state = RPT_JITTERY; break; case SRC_UNREACHABLE: report->state = RPT_UNREACH; break; case SRC_FALSETICKER: report->state = RPT_FALSETICKER; break; default: report->state = RPT_OTHER; break; } /* Call stats module to fill out estimates */ SST_DoSourceReport(src->stats, report, now); return 1; } } /* ================================================== */ int SRC_ReportSourcestats(int index, RPT_SourcestatsReport *report) { SRC_Instance src; if ((index >= n_sources) || (index < 0)) { return 0; } else { src = sources[index]; report->ip_addr = src->ref_id; SST_DoSourcestatsReport(src->stats, report); return 1; } } /* ================================================== */ SRC_Skew_Direction SRC_LastSkewChange(SRC_Instance inst) { SRC_Skew_Direction result = SRC_Skew_Nochange; switch (SST_LastSkewChange(inst->stats)) { case SST_Skew_Decrease: result = SRC_Skew_Decrease; break; case SST_Skew_Nochange: result = SRC_Skew_Nochange; break; case SST_Skew_Increase: result = SRC_Skew_Increase; break; } return result; } /* ================================================== */