timed(8) の実装を読む[前編] - インターネット時刻同期の歴史(その3) | I know I believe in nothing but it is my sweet nothing

マスター側のコードを読む

マスターとなった timed(8) は 240 秒ごとにスレーブのコマンドをポーリングする。

なお実装はビジーウェイトで gettimeofday(2) システムコールを連打し 240 秒経過したらメッセージ処理というやべーコード。現代の感覚だとタイマーお使いにならないんですか(油汗)って言いたくなるが当時のヒッピー文化でタイマーとは吸うものなのだ(ジミヘンのパープルヘイズを聴きながら)。

4.3BSD/usr/src/etc/timed/globals.h#22

22 #define SAMPLEINTVL	240		/* synch() freq for master, sec */

4.3BSD/usr/src/etc/timed/master.c#38

master()
{
...
long pollingtime;
...
struct tsp *msg, to;
...
pollingtime = 0;

loop:
(void)gettimeofday(&time, (struct timezone *)0);
if (time.tv_sec >= pollingtime) {
	pollingtime = time.tv_sec + SAMPLEINTVL;
	synch(0L);
...
}
...
msg = readmsg(TSP_ANY, (char *)ANYADDR, &wait, (struct netinfo *)NULL);
if (msg != NULL) {
	switch (msg->tsp_type) {
...
	}
}
goto loop;
}

synch() で時刻調整を行うのだがこの部分はメインディッシュだから後回しにする。

TSP_SLAVEUP コマンドを処理する

ネットワーク上に新たなスレーブ候補が現れて参加を求めてるのが TSP_SLAVEUP コマンド、お前が奴隷調教志願の豚か(鞭の音)？

4.3BSD/usr/src/etc/timed/master.c#101

	case TSP_SLAVEUP:
		ind = addmach(msg->tsp_name, &from);
		newslave(ind, msg->tsp_seq);
		break;

この時マスターがやることは

addmach() … 奴隷リストに追加
newslave() … 強制的に時刻同期

である。

奴隷リストは host 構造体(サイバーパンク歌舞伎町)型の配列 hp で管理され、最大 NHOSTS つまり 100 台までが参加できる、いや少なくねえ！？ってそりゃスケールするわけねえ、最初から LAN(Local Area Network) 向けを謳ってるわけですわ。

4.3BSD/usr/src/etc/timed/globals.h#53

#define NHOSTS		100	/* max number of hosts controlled by timed */

struct host {
char *name;
struct sockaddr_in addr;
long delta;
u_short seq;
};
...
extern struct host hp[];

4.3BSD/usr/src/etc/timed/timed.c#37

37 struct host hp[NHOSTS];

4.3BSD/usr/src/etc/timed/master.c#383

findhost(name)
char *name;
{
int i;
int ind;

ind = -1;
for (i=1; i<slvcount; i++) {
	if (strcmp(name, hp[i].name) == 0) {
		ind = i;
		break;
	}
}
return(ind);
}

/*
* 'addmach' adds a host to the list of controlled machines
* if not already there 
*/

addmach(name, addr)
char *name;
struct sockaddr_in *addr;
{
int ret;
int findhost();

ret = findhost(name);
if (ret < 0) {
	hp[slvcount].addr = *addr;
	hp[slvcount].name = (char *)malloc(MAXHOSTNAMELEN);
	(void)strcpy(hp[slvcount].name, name);
	hp[slvcount].seq = 0;
	ret = slvcount;
	if (slvcount < NHOSTS)
		slvcount++;
	else {
		syslog(LOG_ERR, "no more slots in host table");
	}
} else {
	/* need to clear sequence number anyhow */
	hp[ret].seq = 0;
}
#ifdef MEASURE
header = ON;
#endif
return(ret);
}

findhost() の実装もひどい、スレーブのホスト名の一致しか見てないから詐称するだけで別のスレーブにマスターからコマンド送り放題だと思われるが、そういう時代だったんだよ(しろめ)。

余談っぽくなるが最新版において 100 台縛りはリンクリスト化することで制限解除されたようなことを前回書いてしまった。

確かに host 構造体は hosttbl 構造体に改められて双方向リストに書き直されてはいる。しかしダイナミックアロケーションはしておらず固定長配列プールからリスト作ってるだけなんだなこれ。よって NHOSTS は 1013 に増やしたものの縛りはいまだ残っているというクソ実装であった。

usr.sbin/timed/timed/globals.h#101

#define NHOSTS		1013	/* max of hosts controlled by timed
				 * This must be a prime number.
				 */
struct hosttbl {
struct	hosttbl *h_bak;		/* hash chain */
struct	hosttbl *h_fwd;
struct  hosttbl *l_bak;		/* "sequential" list */
struct  hosttbl *l_fwd;
...
};

/* closed hash table with internal chaining */
extern struct hosttbl hosttbl[NHOSTS+1];

コメントに closed hash table とあるけどホスト名文字列のハッシュ値を配列のインデックスにするだけの手抜き実装、ホスト名はユニークだから衝突しっこないだろガハハ。

usr.sbin/timed/timed/master.c#532

struct hosttbl *			/* answer or 0 */
findhost(char *name)
{
int i, j;
struct hosttbl *htp;
char *p;

j= 0;
for (p = name, i = 0; i < 8 && *p != '\0'; i++, p++)
	j = (j << 2) ^ *p;
newhost_hash = &hosttbl[j % NHOSTS];

htp = newhost_hash;
if (htp->name[0] == '\0')
	return(0);
do {
	if (!strcmp(name, htp->name))
		return(htp);
	htp = htp->h_fwd;
} while (htp != newhost_hash);
return(0);
}

ほい、リスト要素は歯抜けの配列をイテレートするためだけのものってこった。

分散コンピューティングなんだから DHT(Distributed Hash Table) を実装しろと時代錯誤の贅沢は言わんけど、せめて赤黒木でハッシュテーブル実装しませんかね(しろめ)。まだ当時発明されてなかったりしたらゴメンと検索したらとっくにされてんじゃねーか。

存在しない過去記事も何度か紹介したがいまどきは tree(3) あるいは rbtree(3) あるからハッシュテーブルなんて秒で実装できるけど、当時はそれすらめんどくさいのが C なのだ。そりゃスケールするわけがない、おいしいですよね青魚DHA。

マスターはスレーブを管理用の配列につっこんだら最初の一回だけ TSP_SETTIME コマンドを投げてスレーブに強制時刻同期を迫る。

4.3BSD/usr/src/etc/timed/master.c#502

newslave(ind, seq)
u_short seq;
{
struct tsp to;
struct tsp *answer, *acksend();

if (trace)
	prthp();
if (seq == 0 || hp[ind].seq !=  seq) {
	hp[ind].seq = seq;
	to.tsp_type = TSP_SETTIME;
	(void)strcpy(to.tsp_name, hostname);
	/*
	 * give the upcoming slave the time
	 * to check its input queue before
	 * setting the time
	 */
	sleep(1);
	(void) gettimeofday(&to.tsp_time,
	    (struct timezone *)0);
	answer = acksend(&to, &hp[ind].addr,
	    hp[ind].name, TSP_ACK,
	    (struct netinfo *)NULL);
	if (answer == NULL) {
		syslog(LOG_WARNING,
		    "no reply to initial SETTIME from: %s",
		    hp[ind].name);
		rmmach(ind);
	}
}
}

この時だけは時刻が逆戻りする可能性がある、timed(8) が起動スクリプト rc(8) から呼ばれる時だけだしいいよね…っておおらかな時代の実装だなぁ。

スレーブ側で TSP_SETTIME をどう処理するかはそっちのコードを読む際に説明する。

その他のコマンド処理

説明する価値ないので省略！

synch() による時刻調整

いよいよ前回文章で流しただけの TEMPO による時刻調整のコードを読んでいこう。

4.3BSD/usr/src/etc/timed/master.c#502

extern int measure_delta;
...
/*
* `synch' synchronizes all the slaves by calling measure, 
* networkdelta and correct 
*/

synch(mydelta)
long mydelta;
{
int i;
int measure_status;
...
struct timeval tack;
...
	machup = 1;
	hp[0].delta = 0;
	for(i=1; i<slvcount; i++) {
		tack.tv_sec = 0;
		tack.tv_usec = 500000;
		if ((measure_status = measure(&tack, &hp[i].addr)) <0) {
			syslog(LOG_ERR, "measure: %m");
			exit(1);
		}
		hp[i].delta = measure_delta;
		if (measure_status == GOOD)
			machup++;
	}
...
			netdelta = networkdelta();
			correct(netdelta);

ポイントは以下の 3 つの関数で、ペーパーにあったポンチ絵 3 枚と対応している。

measure() による clockdiff の測定
networkdelta() による「正しい時刻」の決定
correct() による時刻調整

measure() による clockdiff の測定

自身とスレーブの時間差 clockdiff を収集する作業、最終的にグローバル変数の measure_delta に値がセットされる。

まずはICMP timestamp をスレーブに送って返してくるまでの時間、すなわちラウンドトリップタイム (RTT) の計測を行う。

4.3BSD/usr/src/etc/timed/measure.c#29

/*
* Measures the differences between machines' clocks using
* ICMP timestamp messages.
*/

measure(wait, addr)
struct timeval *wait;
struct sockaddr_in *addr;
{
...
/*
 * To measure the difference, select MSGS messages whose round-trip
 * time is smaller than RANGE if ckrange is 1, otherwise simply
 * select MSGS messages regardless of round-trip transmission time.
 * Choose the smallest transmission time in each of the two directions.
 * Use these two latter quantities to compute the delta between
 * the two clocks.
 */
...
oicp->icmp_type = ICMP_TSTAMP;
...
	(void)gettimeofday (&tv1, (struct timezone *)0);
	sendtime = oicp->icmp_otime = (tv1.tv_sec % (24*60*60)) * 1000 
						+ tv1.tv_usec / 1000;
...
	count = sendto(sock_raw, (char *)opacket, sizeof(*oicp), 0, 
			addr, sizeof(struct sockaddr_in));
...
	for (;;) {
...
		cc = recvfrom(sock_raw, (char *)packet, PACKET_IN, 0, 
		    (struct sockaddr_in *)NULL, &length);
		(void)gettimeofday(&tv1, (struct timezone *)0);
...
		icp = (struct icmp *)(packet + (ip->ip_hl << 2));
		if((icp->icmp_type == ICMP_TSTAMPREPLY) &&
		    icp->icmp_id == id && icp->icmp_seq == seqno)
			break;
	}
...
	recvtime = (tv1.tv_sec % (24*60*60)) * 1000 +
	    tv1.tv_usec / 1000;
	diff = recvtime - sendtime;
...
}

sendtime … 送信時間( sendto(2) で ICMP_TSTAMP なパケットを送信する直前)
recvtime … 受信時間( recvfrom(2) で ICMP_TSTAMPREPLY なパケットを受信した直後)
diff … ラウンドトリップタイム(受信時間から送信時間を引いたもの)

簡単ですね？ ping(8) のコードで RTT 学ぶよりコードが簡潔な分判りやすいといえる。

お次はスレーブの現在時間の取得、というかさっきの受信パケットで取得済である。

4.3BSD/usr/src/etc/timed/measure.c#132

132 		histime = ntohl((u_long)icp->icmp_rtime);

ほい RFC792 INTERNET CONTROL MESSAGE PROTOCOL でいうところの Timestamp Reply Message データグラム

Timestamp or Timestamp Reply Message

    0                   1                   2                   3
    0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1 2 3 4 5 6 7 8 9 0 1
   +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
   |     Type      |      Code     |          Checksum             |
   +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
   |           Identifier          |        Sequence Number        |
   +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
   |     Originate Timestamp                                       |
   +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
   |     Receive Timestamp                                         |
   +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+
   |     Transmit Timestamp                                        |
   +-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+-+

これの Receive Timestamp がスレーブの現在時間。ところで変数名が HisTime (彼の時間)ってやっぱ雄豚なんだなぁ…

4.3BSD/usr/src/etc/timed/globals.h#24

/*
* Parameters for network time measurement
* of each host using ICMP timestamp requests.
*/
#define RANGE		20		/* best expected round-trip time, ms */

4.3BSD/usr/src/etc/timed/measure.c#17

#define BIASP	 	43199999
#define BIASN		-43200000
#define MODULO	 	86400000
...
long sendtime, recvtime, histime;
long min1, min2, diff;
register long delta1, delta2;
...
	delta1 = histime - sendtime;
	/*
	 * Handles wrap-around to avoid that around 
	 * midnight small time differences appear 
	 * enormous. However, the two machine's clocks
	 * must be within 12 hours from each other.
	 */
	if (delta1 < BIASN)
		delta1 += MODULO;
	else if (delta1 > BIASP)
		delta1 -= MODULO;
	delta2 = recvtime - histime;
	if (delta2 < BIASN)
		delta2 += MODULO;
	else if (delta2 > BIASP)
		delta2 -= MODULO;

なにやらゴチャゴチャしてるけどまず最初に理解すべきは

delta1 = histime - sendtime … マスター → スレーブの到達時間(スレーブ現在時間 - 送信時間)
delta2 = recvtime - histime … スレーブ → マスターの到達時間(受信時間 - スレーブ現在時間)
diff = recvtime - sendtime … ラウンドトリップタイム(受信時間 - 送信時間)

のみっつ、送受信時間はマスター計測なので delta1 と delta2 にはマスターとスレーブとの時差が含まれている。

そして謎の定数みっつだけど、86400000 が 24*60*60*1000 である事に気づくと

BIASP … プラス 12 時間
BIASN … マイナス 12 時間
MODULO … 24時間

の意味だとわかる、なーにが BIAS (=偏差)と MODULO (=剰余)じゃこれだから理系は。

しかしなぜ delta1 と delta2 を前後 24 時間ずらす必要があるのか。それは再掲になるが以下の処理を思い出せ。

4.3BSD/usr/src/etc/timed/measure.c#96

	sendtime = oicp->icmp_otime = (tv1.tv_sec % (24*60*60)) * 1000 
						+ tv1.tv_usec / 1000;
...
	recvtime = (tv1.tv_sec % (24*60*60)) * 1000 +
	    tv1.tv_usec / 1000;

そう送受信「時刻」でなく「時間」なのだ、すでに 24 時間(86400 秒)で割った余りにしちゃってるからね。よって送受信の間に日を跨いだら sendtime > recvtime と逆転してしまう。だから補正しないと正しい値にならんのだ。

ICMP timestamp の時間表現(ミリ秒)を優先してるから仕方ない面もあるがもっと判りやすいコードにならんか。

まぁいいや、お次のコード。

4.3BSD/usr/src/etc/timed/measure.c#44

long min1, min2, diff;
...
min1 = min2 = 0x7fffffff;
...
	if (delta1 < min1)  
		min1 = delta1;
	if (delta2 < min2)
		min2 = delta2;
	if (diff < RANGE) {
		min1 = delta1;
		min2 = delta2;
		break;
	}

delta1 と delta2 が 0x7fffffff より大きくなるケースが判らない。計算元となる sendtime と recvtime はソースが gettimeofday(2) だから絶対に無い。可能性があるのは ICMP timestamp がソースの histime だけど以下のコードあるし到達不能コードだよなこれ。

4.3BSD/usr/src/etc/timed/measure.c#133

	/*
	 * a hosts using a time format different from 
	 * ms. since midnight UT (as per RFC792) should
	 * set the high order bit of the 32-bit time
	 * value it transmits.
	 */
	if ((histime & 0x80000000) != 0) {
		status = NONSTDTIME;
		break;
	}

あとは MODULO の補正でオーバーフローあるいはアンダーフロー？たった 24 時間の足し引きでそうなるなら既に値が異常だよね…

まぁいい、delta1 と delta2 が 0x7fffffff より大きい異常事態でも diff すなわちラウンドトリップタイムが RANGE つまり 20 ミリ秒未満なら採用される。仕様書通りならどうせ最後に異常値扱いで除外されるでしょう…

長かった measure() もようやくフィナーレである。

4.3BSD/usr/src/etc/timed/measure.c#20

 20 #define PROCESSING_TIME	5 	/* ms. to reduce error in measurement */
...
176 		measure_delta = (min1 - min2)/2 + PROCESSING_TIME;

ここまできたのなら実際に計算してみようかね、例題として

マスターとスレーブの時刻差は 10 秒
ラウンドトリップタイムは 2 秒

というケースを想定する。

[master]        [slave]
00:00:00        00:00:10

00:00:00  1 ->  00:00:11
00:00:02  <- 1  00:00:11

sendtime = 00:00:00
recvtime = 00:00:02
histime  = 00:00:11

diff = recvtime(00:00:02) - sendtime(00:00:00) = 2

delta1 = histime(00:00:11) - sendtime(00:00:00) = 11
delta2 = recvtime(00:00:02) - histime(00:00:11) = -9

min1 = delta1(11)
min2 = delta2(-9)

measure_delta = (min1(11) - min2(-9))/2 = 10

という計算になる、おお！ measure_delta は 10 秒で正確にマスターとスレーブの時刻差が取得できてるわけだ。

まぁ勘の良い人はもうお気づきかと思いますが、この計算ってラウンドトリップが常に対称的(行きと帰りの所要時間が同じ)であるという幸せな前提に頼ってるんだよね。

最大で行きと帰りの時間差 1/2 の誤差が生じるアルゴリズムなのだ、ただしこれは NTP も同様の問題があったはずである。

最後に PROCESSING_TIME つまり 5 ミリ秒を足してるのは、measure() 自体が費やした計算時間がだいたいそれくらいというアバウトな補正である。

うーんこれマシンの性能が上がってるわけで 5 ミリ秒って現実に即してないっす誤差ふえるっす。ちゃんと測ればいいんじゃないですかね…

まぁ下手に計測すると今度は Windows 98 の NDIS.VXD 問題みたいなの起こすこともあるけど。初期化中に 100 万回空ループした時間を計測しその時間で割り算するんだが K6 以降の高速な CPU だと小数点以下なのでゼロ除算エラー起こして Windows 保護エラーになるという有名なやつ。

networkdelta() による「正しい時刻」の決定

まずはどうでもいい部分、x[NHOSTS] にすべてのスレーブの delta をコピー。

4.3BSD/usr/src/etc/timed/networkdelta.c#16

/*
* `networkdelta' selects the largest set of deltas that fall within the
* interval RANGE, and uses them to compute the network average delta 
*/

long networkdelta()
{
int i, j, maxind, minind;
...
int tempind;
long tempdata;
long x[NHOSTS];
...

for (i=0; i<slvcount; i++)
	x[i] = hp[i].delta;

その次の行からが衝撃的である。選択ソートしかも手書きって遭遇するの何年ぶりだろう(絶滅動物を発見した時の顔)。なお qsort(3) は V5 UNIX の頃から存在するしここで安定ソートが必要なわけでもないしナニコレ。

4.3BSD/usr/src/etc/timed/networkdelta.c#32

for (i=0; i<slvcount-1; i++) {
	tempdata = x[i];
	tempind = i;
	for (j=i+1; j<slvcount; j++) {
		if (x[j] < tempdata) {
			tempdata = x[j];
			tempind = j;
		}
	}
	x[tempind] = x[i];
	x[i] = tempdata;
}

お次、 DO NOT TOUCH IT! 触るんじゃねえってあるけど触りたくねえ！の間違いじゃねぇかなこれ。

4.3BSD/usr/src/etc/timed/networkdelta.c#45

/* this piece of code is critical: DO NOT TOUCH IT! */
/****/
i=0; j=1; minind=0; maxind=1;
if (machup == 2)
	goto compute;
do {
	if (x[j]-x[i] <= RANGE)
		j++;
	else {
		if (j > i+1) 
				j--; 
		if ((x[j]-x[i] <= RANGE) && (j-i >= maxind-minind)) {
			minind=i;
			maxind=j;
		}	
		i++;
		if(i = j)
			j++;
	}
} while (j < machup);
if ((x[machup-1] - x[i] <= RANGE) && (machup-i-1 >= maxind-minind)) {
	minind=i; maxind=machup-1;
}

時刻差が RANGE つまり 20 ミリ秒に収まってる範囲を探し、その範囲の開始を minind 終了を maxind としてそれ以外はバッサリ異常値と判定する。

えぇ…これ 20 ミリ秒以内で連続してさえいれば、もっとも時刻差の大きい集合が集計対象になってしまうがいいのかこれ。

それと if(i = j) とか明らかにバグってそうなんだが大丈夫？本当に if((i = j) != 0) こそ意図したコードなのかそれとも if(i == j) の typo なのかまるでコード理解する気にならねえ！

そんで最後に正常値と判定された集合の平均を計算しこれを「正しい時刻」として返している。

4.3BSD/usr/src/etc/timed/networkdelta.c#24

int ext;
...
long average;
...
/****/
compute:
ext = maxind - minind + 1;
average = 0;
for (i=minind; i<=maxind; i++)
	average += x[i];
average /= ext;
return(average);

小数点以下切捨てかぁ。

賢明なる読者(検索エンジンは機能不全で SNS 上の広報を拒否する当チラシの裏に読者など存在しえないわけだが)もう初見でこのコード怪しい…ってなるよね。

ご安心ください 4.4BSD の時点ですでに総ツッコみ入れられて完全にコードが書き直されています。なので上記のコードはある意味 You are not expected to understand this だったのだ。

4.4BSD/usr/src/usr.sbin/timed/timed/networkdelta.c#46

/*
* Compute a corrected date.
*	Compute the median of the reasonable differences.  First compute
*	the median of all authorized differences, and then compute the
*	median of all differences that are reasonably close to the first
*	median.
*
* This differs from the original BSD implementation, which looked for
*	the largest group of machines with essentially the same date.
*	That assumed that machines with bad clocks would be uniformly
*	distributed.  Unfortunately, in real life networks, the distribution
*	of machines is not uniform among models of machines, and the
*	distribution of errors in clocks tends to be quite consistent
*	for a given model.  In other words, all model VI Supre Servres
*	from GoFast Inc. tend to have about the same error.
*	The original BSD implementation would chose the clock of the
*	most common model, and discard all others.
*
*	Therefore, get best we can do is to try to average over all
*	of the machines in the network, while discarding "obviously"
*	bad values.
*/

おお、統計学知らずによくプログラマやってんなおじさん「統計学知らずによくプログラマやってんな」が現れて中央値を使うようになっているね(ニッコリ)、そらそうよ。

まず最初に good かつ measure() で応答のあったスレーブだけで仮の中央値を計算する。

4.4BSD/usr/src/usr.sbin/timed/timed/networkdelta.c#68

long
networkdelta()
{
struct hosttbl *htp;
long med;
...
long x[NHOSTS];
long *xp;
int numdelta;
...
/*
 * compute the median of the good values
 */
med = 0;
numdelta = 1;
xp = &x[0];
*xp = 0;			/* account for ourself */
for (htp = self.l_fwd; htp != &self; htp = htp->l_fwd) {
	if (htp->good
	    && htp->noanswer == 0
	    && htp->delta != HOSTDOWN) {
		med += htp->delta;
		numdelta++;
		*++xp = htp->delta;
	}
}
...
med /= numdelta;

good とはコード引用はしないが

マスター自身
-F オプションで指定されたホスト名に一致
-G オプションで指定された netgroup(5) に属するホスト名に一致

なので後ろふたつ未指定ならマスター時刻となる。ところでお気づきかと思いますが中央値じゃなくて平均値じゃねーか！

もうツッコむのに疲れたのでいいやお次。

仮の中央値(実際は平均値)から VALID_RANGE すなわち妥当な範囲(誤差プラマイ 20 秒) 以外は異常値とし除外した集合の中央値(今度は本当)を出す。

4.4BSD/usr/src/usr.sbin/timed/timed/globals.h#72

80 #define	MAXADJ		20		/* max adjtime() correction in sec */
...
101 #define VALID_RANGE (MAXADJ*1000)	/* good times in milliseconds */

4.4BSD/usr/src/usr.sbin/timed/timed/networkdelta.c#105

105 	eps = med - x[0];
...
109 	med = median(med, &eps, &x[0], xp+1, VALID_RANGE);

libm とかですらソートした結果の真ん中でいいじゃんで実装しない中央値である。それをわざわざソートせずに計算しようとする median() の実装まではもうめんどくさいので追いかけない。今度はちゃんと中央値返してくれることでしょう(願望)。

そしてお次は good なホストであれば中央値から GOOD_RANGE すなわち約 1/30 秒(32 ミリ秒)以内、それ以外のホストは VGOOD_RANGE すなわち 1/60 秒弱(15 ミリ秒)以内に収まる集合の中央値を算出する。

4.4BSD/usr/include/machine/limits.h#40

40 #define	CLK_TCK		60		/* ticks per second */

4.4BSD/usr/src/usr.sbin/timed/timed/globals.h#72

/* Best expected round trip for a measurement.
* This is essentially the number of milliseconds per CPU tick (CLK_TCK?).
* All delays shorter than this are usually reported as 0.
*/
#define MIN_ROUND ((1000-1)/CLK_TCK)
...
#define GOOD_RANGE (MIN_ROUND*2)
#define VGOOD_RANGE (MIN_ROUND-1)

4.4BSD/usr/src/usr.sbin/timed/timed/networkdelta.c#111

/*
 * compute the median of all values near the good median
 */
hidelta = med + GOOD_RANGE;
lodelta = med - GOOD_RANGE;
higood = med + VGOOD_RANGE;
logood = med - VGOOD_RANGE;
xp = &x[0];
htp = &self;
do {
	if (htp->noanswer == 0
	    && htp->delta >= lodelta
	    && htp->delta <= hidelta
	    && (htp->good
		|| (htp->delta >= logood
		    && htp->delta <= higood))) {
		*xp++ = htp->delta;
	}
} while (&self != (htp = htp->l_fwd));

if (xp == &x[0]) {
...
	return med;
}

if (xp == &x[1]) {
...
	return x[0];
}
...
return median(med, &eps, &x[0], xp, 1);

ちなみに CLK_TCK はハードクロックの秒あたりのクロック数、60Hz なら 60 となる。うん HZ マクロの方は 100 返してくるんだけどなガハハ。どうして一致してないんですか？この謎はいずれ調べてみようかと思う。

measure() で適当に 5 ミリ秒とどんぶり勘定してたのよりはクロック数計算するだけマシではあるが、計算速度の進歩を前にすると誤差大きくする結果になるよねこれ。

correct() による時刻調整

まずはマスター自身の時刻調整。

プラマイ 20 秒以内なら adjtime(2) で時刻調整
それ以上なら settimeofday(2) で強制同期

と前回解説した通りである。

4.3BSD/usr/src/etc/timed/correct.c#18

/* 
* `correct' sends to the slaves the corrections for their clocks
*/

correct(avdelta)
long avdelta;
{
...
int corr;
struct timeval adjlocal;
...
corr = avdelta - hp[0].delta;
adjlocal = mstotvround(&corr);
adjclock(&adjlocal);
...
}
...
adjclock(corr)
struct timeval *corr;
{
struct timeval now;
...
	if (corr->tv_sec < MAXADJ && corr->tv_sec > - MAXADJ) {
		(void)adjtime(corr, (struct timeval *)0);
	} else {
...
		(void) gettimeofday(&now, (struct timezone *)0);
		timevaladd(&now, corr);
		if (settimeofday(&now, (struct timezone *)0) < 0)
			syslog(LOG_ERR, "can't set time");
	}
...
}

あとはスレーブに TSP_ADJTIME コマンドを投げるだけである。

4.3BSD/usr/src/etc/timed/correct.c#49

for(i=1; i<slvcount; i++) {
...
		corr = avdelta - hp[i].delta;
		msgs.tsp_time = mstotvround(&corr);
		msgs.tsp_type = (u_char)TSP_ADJTIME;
		(void)strcpy(msgs.tsp_name, hostname);
		answer = acksend(&msgs, &hp[i].addr, hp[i].name,
		    TSP_ACK, (struct netinfo *)NULL);
...
}

ほい、マスター側のソース散策はこれでおしまい。

次回

スレーブ側のコードを読んでいくよ。