Skip to content
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
33 changes: 23 additions & 10 deletions src/heartbeat.js
Original file line number Diff line number Diff line change
Expand Up @@ -24,13 +24,14 @@ class HeartbeatMonitor extends EventEmitter {
this.timestamps = {};

this.start = this.start.bind(this);
this.clearHeartbeatOnWorkerDown = this.clearHeartbeatOnWorkerDown.bind(this);
this.monitorHeartbeat = this.monitorHeartbeat.bind(this);
}

recordHeartbeat(workerId) {
const past = this.timestamps[workerId] || this.heartbeatStartedAt;
const past = this.timestamps[workerId];

if (past !== null) {
if (past != null) {
this.emit(
'info:workerHeartbeatDelta',
workerId,
Expand All @@ -40,16 +41,24 @@ class HeartbeatMonitor extends EventEmitter {
this.timestamps[workerId] = process.hrtime();
}

clearHeartbeatOnWorkerDown(workerId) {
this.timestamps[workerId] = null;
}

start() {
this.heartbeatStartedAt = process.hrtime();

this.supervisor.on('workerDown', this.clearHeartbeatOnWorkerDown);

this.monitorHeartbeat();
}

stop() {
if (this.monitorHeartbeatTimeout) {
clearTimeout(this.monitorHeartbeatTimeout);
}

this.supervisor.removeListener('workerDown', this.clearHeartbeatOnWorkerDown);
}

monitorHeartbeat() {
Expand All @@ -58,13 +67,17 @@ class HeartbeatMonitor extends EventEmitter {
}

Object.entries(this.supervisor.workers)
.filter(([, worker]) => !worker.isDead()).forEach(([workerId]) => {
const ts = this.timestamps[workerId] || this.heartbeatStartAt;
const delta = hrtimeToMilliseconds(process.hrtime(ts));

if (delta > this.stallTolerance) {
this.emit('workerStall', workerId);
this.emit('info:workerHeartbeatDelta', workerId, delta);
.filter(([, worker]) => !worker.isDead())
.filter(([, worker]) => worker.state === 'up')
.forEach(([workerId]) => {
const ts = this.timestamps[workerId];
if (ts != null) {
const delta = hrtimeToMilliseconds(process.hrtime(ts));

if (delta > this.stallTolerance) {
this.emit('workerStall', workerId);
this.emit('info:workerHeartbeatDelta', workerId, delta);
}
}
});

Expand Down Expand Up @@ -94,7 +107,7 @@ export function workerHeartbeat(worker, { workerInterval }) {

function heartbeatFn() {
if (obj.heartbeatTimeout) {
clearTimeout(this.heartbeatTimeout);
clearTimeout(obj.heartbeatTimeout);
}
worker.send({ act: 'poolHallHeartbeat' });
obj.heartbeatTimeout = setTimeout(heartbeatFn, interval);
Expand Down
48 changes: 45 additions & 3 deletions tests/heartbeat.test.js
Original file line number Diff line number Diff line change
Expand Up @@ -83,12 +83,15 @@ describe('heartbeat', () => {
});
Object.values(supervisor.workers).forEach((worker) => {
worker.emit('message', { act: 'poolHallHeartbeat' });
worker.emit('up');
worker.process.emit('message', { poolHallInternal: true, act: 'ready' });
});
});

it('reports stalled workers', (done) => {
supervisor.start();
Object.values(supervisor.workers).forEach((worker) => {
worker.state = 'up'; // eslint-disable-line no-param-reassign
Comment thread
ljharb marked this conversation as resolved.
});
const strId = Object.keys(supervisor.workers)[0];
monitor.heartbeatStartedAt = now; // timer won't be installed immediately
monitor.timestamps[strId] = [now[0] - 10, now[1]];
Expand All @@ -99,9 +102,26 @@ describe('heartbeat', () => {
monitor.monitorHeartbeat();
});

it('does not report down workers as stalled', () => {
supervisor.start();
Object.values(supervisor.workers).forEach((worker) => {
worker.state = 'down'; // eslint-disable-line no-param-reassign
});
const strId = Object.keys(supervisor.workers)[0];
monitor.heartbeatStartedAt = now; // timer won't be installed immediately
monitor.timestamps[strId] = [now[0] - 10, now[1]];
Comment thread
ljharb marked this conversation as resolved.
monitor.once('workerStall', () => {
assert.fail();
});
monitor.monitorHeartbeat();
});

it('does not report workers not stalled', () => {
supervisor.start();
monitor.heartbeatStartedAt = now;
Object.values(supervisor.workers).forEach((worker) => {
worker.state = 'up'; // eslint-disable-line no-param-reassign
});
Object.keys(supervisor.workers)
.forEach((strId) => {
monitor.timestamps[strId] = now;
Expand All @@ -128,7 +148,7 @@ describe('heartbeat', () => {

Object.values(supervisor.workers).forEach((worker) => {
worker.emit('message', { act: 'poolHallHeartbeat' });
worker.emit('up');
worker.process.emit('message', { poolHallInternal: true, act: 'ready' });
});
setImmediate(jest.runOnlyPendingTimers);
});
Expand All @@ -139,12 +159,34 @@ describe('heartbeat', () => {
monitor.once('info:workerHeartbeatDelta', () => done());
Object.values(supervisor.workers).forEach((worker) => {
worker.emit('message', { act: 'poolHallHeartbeat' });
worker.emit('up');
worker.process.emit('message', { poolHallInternal: true, act: 'ready' });
});
Object.values(supervisor.workers).forEach((worker) => {
worker.emit('message', { act: 'poolHallHeartbeat' });
});
});

it('clears heartbeat timestamp on workerDown', () => {
supervisor.start();
monitor.start();

Object.values(supervisor.workers).forEach((worker) => {
worker.emit('message', { act: 'poolHallHeartbeat' });
worker.process.emit('message', { poolHallInternal: true, act: 'ready' });
});

Object.keys(supervisor.workers).forEach((workerId) => {
assert(monitor.timestamps[workerId] != null);
});

Object.values(supervisor.workers).forEach((worker) => {
worker.emit('down');
});

Object.keys(supervisor.workers).forEach((workerId) => {
assert.equal(monitor.timestamps[workerId], null);
});
});
});
});
});