upstream/ipython Commit - r10079:fa8f1e1d

1

"""The Python scheduler for rich scheduling.

1

"""The Python scheduler for rich scheduling.

2

3

The Pure ZMQ scheduler does not allow routing schemes other than LRU,

3

The Pure ZMQ scheduler does not allow routing schemes other than LRU,

4

nor does it check msg_id DAG dependencies. For those, a slightly slower

4

nor does it check msg_id DAG dependencies. For those, a slightly slower

5

Python Scheduler exists.

5

Python Scheduler exists.

6

7

Authors:

7

Authors:

8

9

* Min RK

9

* Min RK

10

"""

10

"""

11

#-----------------------------------------------------------------------------

11

#-----------------------------------------------------------------------------

12

13

#

13

#

14

# Distributed under the terms of the BSD License. The full license is in

14

# Distributed under the terms of the BSD License. The full license is in

15

# the file COPYING, distributed as part of this software.

15

# the file COPYING, distributed as part of this software.

16

#-----------------------------------------------------------------------------

16

#-----------------------------------------------------------------------------

17

18

#----------------------------------------------------------------------

18

#----------------------------------------------------------------------

19

# Imports

19

# Imports

20

#----------------------------------------------------------------------

20

#----------------------------------------------------------------------

21

22

import heapq

23

import logging

22

import logging

24

import sys

23

import sys

25

import time

24

import time

26

25

27

from datetime import datetime, timedelta

26

from collections import deque

27

from datetime import datetime

28

from random import randint, random

28

from random import randint, random

29

from types import FunctionType

29

from types import FunctionType

30

31

try:

31

try:

32

import numpy

32

import numpy

33

except ImportError:

33

except ImportError:

34

numpy = None

34

numpy = None

35

36

import zmq

36

import zmq

37

from zmq.eventloop import ioloop, zmqstream

37

from zmq.eventloop import ioloop, zmqstream

38

39

# local imports

39

# local imports

40

from IPython.external.decorator import decorator

40

from IPython.external.decorator import decorator

41

from IPython.config.application import Application

41

from IPython.config.application import Application

42

from IPython.config.loader import Config

42

from IPython.config.loader import Config

43

from IPython.utils.traitlets import Instance, Dict, List, Set, Integer, Enum, CBytes

43

from IPython.utils.traitlets import Instance, Dict, List, Set, Integer, Enum, CBytes

44

from IPython.utils.py3compat import cast_bytes

44

from IPython.utils.py3compat import cast_bytes

45

46

from IPython.parallel import error, util

46

from IPython.parallel import error, util

47

from IPython.parallel.factory import SessionFactory

47

from IPython.parallel.factory import SessionFactory

48

from IPython.parallel.util import connect_logger, local_logger

48

from IPython.parallel.util import connect_logger, local_logger

49

50

from .dependency import Dependency

50

from .dependency import Dependency

51

52

@decorator
def logged(f, self, *args, **kwargs):
    """Log a debug line naming the wrapped method, then call it.

    `f` is the wrapped function and `self` the object it is called on;
    `self.log` must provide ``debug``.  The positional and keyword
    arguments are logged and then forwarded to `f` untouched, and the
    return value of `f` is passed straight through.
    """
    # `__name__` exists on both Python 2 and Python 3 functions, whereas
    # `func_name` is Python 2 only.
    self.log.debug("scheduler::%s(*%s,**%s)", f.__name__, args, kwargs)
    return f(self, *args, **kwargs)

58

59

#----------------------------------------------------------------------

59

#----------------------------------------------------------------------

60

# Chooser functions

60

# Chooser functions

61

#----------------------------------------------------------------------

61

#----------------------------------------------------------------------

62

63

def plainrandom(loads):
    """Return a uniformly random index into `loads`.

    Only the length of `loads` matters; its values are never inspected.
    """
    last = len(loads) - 1
    return randint(0, last)

67

68

def lru(loads):
    """Pick the head of the line: always index 0.

    `loads` itself is never looked at.  The caller is expected to keep it
    in LRU order, oldest first, which makes the first entry the
    least-recently-used one.
    """
    head = 0
    return head

76

77

def twobin(loads):
    """Draw two random indices and keep the smaller (the LRU of the two).

    The values in `loads` are ignored; only its length is used.

    Assumes LRU ordering of loads, with oldest first, so the lower index
    is the less recently used candidate.
    """
    upper = len(loads) - 1
    first = randint(0, upper)
    second = randint(0, upper)
    return first if first <= second else second

88

89

def weighted(loads):
    """Pick two candidates at random, weighted by inverse load.

    Each index is drawn with probability proportional to
    ``1 / (1e-6 + load)``; of the two draws, the one with the larger
    weight (i.e. the smaller load) is returned.  On a tie the first draw
    wins.
    """
    # the 1e-6 offset makes a load of 0 weigh a million times more than 1
    weights = 1./(1e-6+numpy.array(loads))
    sums = weights.cumsum()
    total = sums[-1]

    # both random numbers are drawn before either scan, first x then y
    x = random()*total
    y = random()*total

    def first_reaching(threshold):
        # index of the first cumulative sum that is not below `threshold`
        position = 0
        while sums[position] < threshold:
            position += 1
        return position

    idx = first_reaching(x)
    idy = first_reaching(y)
    return idy if weights[idy] > weights[idx] else idx

110

111

def leastload(loads):
    """Return the index of the smallest load.

    When the minimum appears several times the first occurrence wins.
    If `loads` is kept in LRU order, that is the least-recently-used
    among the least-loaded entries.
    """
    lowest = min(loads)
    return loads.index(lowest)

119

120

#---------------------------------------------------------------------

120

#---------------------------------------------------------------------

121

# Classes

121

# Classes

122

#---------------------------------------------------------------------

122

#---------------------------------------------------------------------

123

124

125

# store empty default dependency:

125

# store empty default dependency:

126

MET = Dependency([])

126

MET = Dependency([])

127

128

129

class Job(object):
    """Simple container for a job.

    Holds everything the scheduler keeps about one submitted task: the
    message in its raw and unpacked forms, the routing identities, the
    target restriction, the `after` and `follow` dependencies and the
    timeout.  Jobs compare by creation time, oldest first.
    """
    def __init__(self, msg_id, raw_msg, idents, msg, header, metadata,
                 targets, after, follow, timeout):
        self.msg_id = msg_id
        self.raw_msg = raw_msg
        self.idents = idents
        self.msg = msg
        self.header = header
        self.metadata = metadata
        self.targets = targets
        self.after = after
        self.follow = follow
        self.timeout = timeout
        self.removed = False # used for lazy-delete from sorted queue

        # creation time; this is the sort key used by __lt__ / __cmp__
        self.timestamp = time.time()
        self.blacklist = set()

    def __lt__(self, other):
        return self.timestamp < other.timestamp

    def __cmp__(self, other):
        # Python 2 comparison hook.  Written without the `cmp` builtin,
        # which does not exist on Python 3; the result is still -1, 0 or 1.
        mine, theirs = self.timestamp, other.timestamp
        return (mine > theirs) - (mine < theirs)

    @property
    def dependents(self):
        """Union of the `follow` and `after` dependencies."""
        return self.follow.union(self.after)

157

158

class TaskScheduler(SessionFactory):

158

class TaskScheduler(SessionFactory):

159

"""Python TaskScheduler object.

159

"""Python TaskScheduler object.

160

161

This is the simplest object that supports msg_id based

161

This is the simplest object that supports msg_id based

162

DAG dependencies. *Only* task msg_ids are checked, not

162

DAG dependencies. *Only* task msg_ids are checked, not

163

msg_ids of jobs submitted via the MUX queue.

163

msg_ids of jobs submitted via the MUX queue.

164

165

"""

165

"""

166

167

# Configurable: maximum number of outstanding tasks per engine (0 = no limit).
hwm = Integer(1, config=True,
    help="""specify the High Water Mark (HWM) for the downstream
    socket in the Task scheduler. This is the maximum number
    of allowed outstanding tasks on each engine.

    The default (1) means that only one task can be outstanding on each
    engine. Setting TaskScheduler.hwm=0 means there is no limit, and the
    engines continue to be assigned tasks while they are working,
    effectively hiding network latency behind computation, but can result
    in an imbalance of work when submitting many heterogenous tasks all at
    once. Any positive value greater than one is a compromise between the
    two.

    """
)
# Configurable: name of the chooser function used to pick a destination.
# NOTE(review): the help text advertises "Python LRU" as the default while
# the declared default value is 'leastload'.
# NOTE(review): _scheme_name_changed resolves the name via globals(); no
# module-level function called `pure` is visible in this part of the file,
# so confirm how the 'pure' option is handled.
scheme_name = Enum(('leastload', 'pure', 'lru', 'plainrandom', 'weighted', 'twobin'),
    'leastload', config=True, allow_none=False,
    help="""select the task scheduler scheme [default: Python LRU]
    Options are: 'pure', 'lru', 'plainrandom', 'weighted', 'twobin','leastload'"""
)

187

def _scheme_name_changed(self, old, new):
    """Point `self.scheme` at the chooser function named `new`.

    Presumably invoked by the traitlets machinery whenever `scheme_name`
    changes (the name follows the ``_<trait>_changed`` convention).

    The function is looked up by name among this module's globals, so
    `new` has to name a module-level object; an unknown name raises
    KeyError.  `old` is not used.
    """
    # pass `new` as a logger argument so that the message is only
    # formatted when debug output is actually emitted
    self.log.debug("Using scheme %r", new)
    self.scheme = globals()[new]

190

191

# input arguments:
scheme = Instance(FunctionType) # function for determining the destination
def _scheme_default(self):
    # same chooser as the default value of `scheme_name` ('leastload')
    return leastload
# the five ZMQ streams the scheduler talks over; start() attaches the
# receive callbacks to them
client_stream = Instance(zmqstream.ZMQStream) # client-facing stream
engine_stream = Instance(zmqstream.ZMQStream) # engine-facing stream
notifier_stream = Instance(zmqstream.ZMQStream) # hub-facing sub stream
mon_stream = Instance(zmqstream.ZMQStream) # hub-facing pub stream
query_stream = Instance(zmqstream.ZMQStream) # hub-facing DEALER stream

200

201

# internals:
queue = Instance(deque) # sorted list of Jobs
def _queue_default(self):
    # every scheduler starts with its own empty deque
    return deque()
queue_map = Dict() # dict by msg_id of Jobs (for O(1) access to the Queue)
graph = Dict() # dict by msg_id of [ msg_ids that depend on key ]
retries = Dict() # dict by msg_id of retries remaining (non-neg ints)
# waiting = List() # list of msg_ids ready to run, but haven't due to HWM
# pending[engine_uuid] is itself a dict keyed by msg_id (see
# _register_engine and handle_stranded_tasks)
pending = Dict() # dict by engine_uuid of submitted tasks
completed = Dict() # dict by engine_uuid of completed tasks
failed = Dict() # dict by engine_uuid of failed tasks
destinations = Dict() # dict by msg_id of engine_uuids where jobs ran (reverse of completed+failed)
clients = Dict() # dict by msg_id for who submitted the task
# `targets` and `loads` are parallel lists: entries are inserted and
# removed at the same index in both
targets = List() # list of target IDENTs
loads = List() # list of engine loads
# full = Set() # set of IDENTs that have HWM outstanding tasks
all_completed = Set() # set of all completed tasks
all_failed = Set() # set of all failed tasks
all_done = Set() # set of all finished tasks=union(completed,failed)
all_ids = Set() # set of all submitted task IDs

ident = CBytes() # ZMQ identity. This should just be self.session.session
                 # but ensure Bytes
def _ident_default(self):
    # `bsession` is read from the session object; presumably the bytes
    # form of the session id -- confirm against the Session class
    return self.session.bsession

224

226

225

def start(self):
    """Attach the receive callbacks to every stream and query the hub.

    A "connection_request" is sent on the query stream; its reply is
    handled by `dispatch_query_reply`.  Results from engines, submissions
    from clients and hub notifications are routed to their respective
    dispatch methods.
    """
    # hub query channel: install the reply handler, then send the request
    self.query_stream.on_recv(self.dispatch_query_reply)
    self.session.send(self.query_stream, "connection_request", {})

    # task traffic is received without copying the message frames
    self.engine_stream.on_recv(self.dispatch_result, copy=False)
    self.client_stream.on_recv(self.dispatch_submission, copy=False)

    # notification msg_type -> handler, consulted by dispatch_notification
    self._notification_handlers = {
        'registration_notification': self._register_engine,
        'unregistration_notification': self._unregister_engine,
    }
    self.notifier_stream.on_recv(self.dispatch_notification)

    scheme = self.scheme_name
    self.log.info("Scheduler started [%s]" % scheme)

238

240

239

def resume_receiving(self):
    """Start accepting job submissions from clients again.

    Re-installs `dispatch_submission` as the receive callback of the
    client stream (zero-copy, as in `start`).
    """
    on_submission = self.dispatch_submission
    self.client_stream.on_recv(on_submission, copy=False)

242

244

243

def stop_receiving(self):
    """Pause job intake, e.g. while no engines are available.

    The receive callback of the client stream is cleared, so incoming
    submissions are left waiting in the ZMQ queue.
    """
    no_handler = None
    self.client_stream.on_recv(no_handler)

247

249

248

#-----------------------------------------------------------------------

250

#-----------------------------------------------------------------------

249

# [Un]Registration Handling

251

# [Un]Registration Handling

250

#-----------------------------------------------------------------------

252

#-----------------------------------------------------------------------

251

253

252

254

253

def dispatch_query_reply(self, msg):
    """handle reply to our initial connection request

    Splits the routing identities off `msg`, unserializes the rest and
    registers every engine uuid found among the values of
    ``content['engines']`` (no engines are registered when the key is
    missing).  A message that cannot be split or unserialized is logged
    as a warning and dropped.
    """
    try:
        idents, msg = self.session.feed_identities(msg)
    except ValueError:
        # `warning` is the supported spelling; `Logger.warn` is deprecated
        # and no longer exists on recent Python versions
        self.log.warning("task::Invalid Message: %r", msg)
        return
    try:
        msg = self.session.unserialize(msg)
    except ValueError:
        self.log.warning("task::Unauthorized message from: %r", idents)
        return

    engines = msg['content'].get('engines', {})
    for uuid in engines.values():
        # engines are tracked by their identity as bytes
        self._register_engine(cast_bytes(uuid))

269

271

270

272

271

@util.log_errors
def dispatch_notification(self, msg):
    """dispatch register/unregister events.

    Splits the routing identities off `msg`, unserializes it and calls
    the handler registered for its ``msg_type`` in
    `self._notification_handlers` with the engine uuid (as bytes) taken
    from the message content.  Malformed messages, unknown message types
    and handler failures are logged rather than raised.
    """
    try:
        idents, msg = self.session.feed_identities(msg)
    except ValueError:
        # `warning` is the supported spelling; `Logger.warn` is deprecated
        # and no longer exists on recent Python versions
        self.log.warning("task::Invalid Message: %r", msg)
        return
    try:
        msg = self.session.unserialize(msg)
    except ValueError:
        self.log.warning("task::Unauthorized message from: %r", idents)
        return

    msg_type = msg['header']['msg_type']

    handler = self._notification_handlers.get(msg_type, None)
    if handler is None:
        self.log.error("Unhandled message type: %r", msg_type)
        return

    try:
        handler(cast_bytes(msg['content']['uuid']))
    except Exception:
        # a broken notification must not take the scheduler down
        self.log.error("task::Invalid notification msg: %r", msg, exc_info=True)

295

297

296

def _register_engine(self, uid):

298

def _register_engine(self, uid):

297

"""New engine with ident `uid` became available."""

299

"""New engine with ident `uid` became available."""

298

# head of the line:

300

# head of the line:

299

self.targets.insert(0,uid)

301

self.targets.insert(0,uid)

300

self.loads.insert(0,0)

302

self.loads.insert(0,0)

301

303

302

# initialize sets

304

# initialize sets

303

self.completed[uid] = set()

305

self.completed[uid] = set()

304

self.failed[uid] = set()

306

self.failed[uid] = set()

305

self.pending[uid] = {}

307

self.pending[uid] = {}

306

308

307

# rescan the graph:

309

# rescan the graph:

308

self.update_graph(None)

310

self.update_graph(None)

309

311

310

def _unregister_engine(self, uid):

312

def _unregister_engine(self, uid):

311

"""Existing engine with ident `uid` became unavailable."""

313

"""Existing engine with ident `uid` became unavailable."""

312

if len(self.targets) == 1:

314

if len(self.targets) == 1:

313

# this was our only engine

315

# this was our only engine

314

pass

316

pass

315

317

316

# handle any potentially finished tasks:

318

# handle any potentially finished tasks:

317

self.engine_stream.flush()

319

self.engine_stream.flush()

318

320

319

# don't pop destinations, because they might be used later

321

# don't pop destinations, because they might be used later

320

# map(self.destinations.pop, self.completed.pop(uid))

322

# map(self.destinations.pop, self.completed.pop(uid))

321

# map(self.destinations.pop, self.failed.pop(uid))

323

# map(self.destinations.pop, self.failed.pop(uid))

322

324

323

# prevent this engine from receiving work

325

# prevent this engine from receiving work

324

idx = self.targets.index(uid)

326

idx = self.targets.index(uid)

325

self.targets.pop(idx)

327

self.targets.pop(idx)

326

self.loads.pop(idx)

328

self.loads.pop(idx)

327

329

328

# wait 5 seconds before cleaning up pending jobs, since the results might

330

# wait 5 seconds before cleaning up pending jobs, since the results might

329

# still be incoming

331

# still be incoming

330

if self.pending[uid]:

332

if self.pending[uid]:

331

dc = ioloop.DelayedCallback(lambda : self.handle_stranded_tasks(uid), 5000, self.loop)

333

dc = ioloop.DelayedCallback(lambda : self.handle_stranded_tasks(uid), 5000, self.loop)

332

dc.start()

334

dc.start()

333

else:

335

else:

334

self.completed.pop(uid)

336

self.completed.pop(uid)

335

self.failed.pop(uid)

337

self.failed.pop(uid)

336

338

337

339

338

def handle_stranded_tasks(self, engine):
    """Deal with jobs resident in an engine that died.

    For every task still listed as pending on `engine`, an 'apply_reply'
    carrying an EngineError is fabricated and fed through
    `dispatch_result`, as if the engine itself had reported the failure.
    Afterwards the engine's completed/failed sets are discarded.
    """
    lost = self.pending[engine]
    # Iterate over a snapshot of the ids: the membership check below shows
    # that entries can vanish from this dict while the loop is running
    # (presumably removed by dispatch_result), and mutating a dict while
    # iterating its live key view raises RuntimeError on Python 3.
    for msg_id in list(lost):
        if msg_id not in self.pending[engine]:
            # prevent double-handling of messages
            continue

        raw_msg = lost[msg_id].raw_msg
        idents, msg = self.session.feed_identities(raw_msg, copy=False)
        parent = self.session.unpack(msg[1].bytes)
        idents = [engine, idents[0]]

        # build fake error reply; the exception is raised and caught only
        # so that wrap_exception() has an active exception to describe
        try:
            raise error.EngineError("Engine %r died while running task %r"%(engine, msg_id))
        except error.EngineError:
            content = error.wrap_exception()
        # build fake metadata
        md = dict(
            status=u'error',
            engine=engine,
            date=datetime.now(),
        )
        msg = self.session.msg('apply_reply', content, parent=parent, metadata=md)
        # a real list of frames on Python 2 and 3 alike (map() would be a
        # one-shot iterator on Python 3)
        raw_reply = [zmq.Message(part)
                     for part in self.session.serialize(msg, ident=idents)]
        # and dispatch it
        self.dispatch_result(raw_reply)

    # finally scrub completed/failed lists
    self.completed.pop(engine)
    self.failed.pop(engine)

370

372

371

373

372

#-----------------------------------------------------------------------

374

#-----------------------------------------------------------------------

373

# Job Submission

375

# Job Submission

374

#-----------------------------------------------------------------------

376

#-----------------------------------------------------------------------

375

377

376

378

377

@util.log_errors
def dispatch_submission(self, raw_msg):
    """Dispatch job submission to appropriate handlers.

    Unpacks the submitted message, forwards a copy to the monitor stream,
    builds a `Job` from the message metadata (targets, retries, `after`
    and `follow` dependencies, timeout) and then either fails it as
    unreachable, tries to run it via `maybe_run`, or stores it via
    `save_unmet`.
    """
    # ensure targets up to date:
    self.notifier_stream.flush()
    try:
        idents, msg = self.session.feed_identities(raw_msg, copy=False)
        msg = self.session.unserialize(msg, content=False, copy=False)
    except Exception:
        # NOTE(review): "Invaid" is a typo in the emitted log message
        self.log.error("task::Invaid task msg: %r"%raw_msg, exc_info=True)
        return


    # send to monitor
    self.mon_stream.send_multipart([b'intask']+raw_msg, copy=False)

    header = msg['header']
    md = msg['metadata']
    msg_id = header['msg_id']
    self.all_ids.add(msg_id)

    # get targets as a set of bytes objects
    # from a list of unicode objects
    targets = md.get('targets', [])
    targets = map(cast_bytes, targets)
    targets = set(targets)

    retries = md.get('retries', 0)
    self.retries[msg_id] = retries

    # time dependencies
    after = md.get('after', None)
    if after:
        after = Dependency(after)
        if after.all:
            # for an all-dependency, msg_ids that already finished with
            # an accepted outcome are dropped from the set up front
            if after.success:
                after = Dependency(after.difference(self.all_completed),
                            success=after.success,
                            failure=after.failure,
                            all=after.all,
                )
            if after.failure:
                after = Dependency(after.difference(self.all_failed),
                            success=after.success,
                            failure=after.failure,
                            all=after.all,
                )
        if after.check(self.all_completed, self.all_failed):
            # recast as empty set, if `after` already met,
            # to prevent unnecessary set comparisons
            after = MET
    else:
        after = MET

    # location dependencies
    follow = Dependency(md.get('follow', []))

    # turn a relative timeout (seconds) into an absolute time.time() deadline:
    timeout = md.get('timeout', None)
    if timeout:
        timeout = time.time() + float(timeout)

    job = Job(msg_id=msg_id, raw_msg=raw_msg, idents=idents, msg=msg,
            header=header, targets=targets, after=after, follow=follow,
            timeout=timeout, metadata=md,
    )
    if timeout:
        # schedule timeout callback
        self.loop.add_timeout(timeout, lambda : self.job_timeout(job))

    # validate and reduce dependencies:
    for dep in after,follow:
        if not dep: # empty dependency
            continue
        # check valid: a job may not depend on itself, nor on a msg_id
        # that was never submitted
        if msg_id in dep or dep.difference(self.all_ids):
            # fail_unreachable only acts on jobs present in queue_map
            self.queue_map[msg_id] = job
            return self.fail_unreachable(msg_id, error.InvalidDependency)
        # check if unreachable:
        if dep.unreachable(self.all_completed, self.all_failed):
            self.queue_map[msg_id] = job
            return self.fail_unreachable(msg_id)

    if after.check(self.all_completed, self.all_failed):
        # time deps already met, try to run
        if not self.maybe_run(job):
            # can't run yet
            if msg_id not in self.all_failed:
                # could have failed as unreachable
                self.save_unmet(job)
    else:
        self.save_unmet(job)

469

471

470

def job_timeout(self, job):
    """callback for a job's timeout.

    The job may or may not have been run at this point.  Only a job that
    is still waiting (its msg_id is still in `queue_map`) is failed, with
    a TaskTimeout error.  A callback that fires a second or more ahead of
    the job's deadline is reported with a warning, but is otherwise
    handled the same way.
    """
    now = time.time()
    if job.timeout >= (now + 1):
        # `warning` is the supported spelling; `Logger.warn` is deprecated
        # and no longer exists on recent Python versions
        self.log.warning("task %s timeout fired prematurely: %s > %s",
            job.msg_id, job.timeout, now
        )
    if job.msg_id in self.queue_map:
        # still waiting, but ran out of time
        self.log.info("task %r timed out", job.msg_id)
        self.fail_unreachable(job.msg_id, error.TaskTimeout)

483

486

484

def fail_unreachable(self, msg_id, why=error.ImpossibleDependency):
    """Fail a queued task that can no longer run and tell the client why.

    The job is removed from ``self.queue_map``, flagged for lazy deletion
    from ``self.queue``, recorded in ``all_done``/``all_failed``, and an
    ``apply_reply`` carrying the wrapped exception is sent to the client
    and mirrored to the monitor stream.  Finally the dependency graph is
    updated so that tasks depending on this one are re-evaluated.

    Parameters
    ----------
    msg_id : the id of the task to fail; it must currently be a key of
        ``self.queue_map``, otherwise an error is logged and nothing else
        happens.
    why : exception class raised (and immediately caught) to build the
        error content of the reply.
    """
    if msg_id not in self.queue_map:
        self.log.error("task %r already failed!", msg_id)
        return
    job = self.queue_map.pop(msg_id)
    # lazy-delete from the queue
    job.removed = True
    for mid in job.dependents:
        if mid in self.graph:
            # discard, not remove: several callers put the job in queue_map
            # and fail it right away, without save_unmet() ever having
            # registered msg_id under this dependency.
            self.graph[mid].discard(msg_id)

    # raise-and-catch so that wrap_exception() has an active exception
    try:
        raise why()
    except Exception:
        content = error.wrap_exception()
    self.log.debug("task %r failing as unreachable with: %s", msg_id, content['ename'])

    self.all_done.add(msg_id)
    self.all_failed.add(msg_id)

    msg = self.session.send(self.client_stream, 'apply_reply', content,
                            parent=job.header, ident=job.idents)
    self.session.send(self.mon_stream, msg, ident=[b'outtask']+job.idents)

    self.update_graph(msg_id, success=False)

511

514

512

def available_engines(self):

515

def available_engines(self):

513

"""return a list of available engine indices based on HWM"""

516

"""return a list of available engine indices based on HWM"""

514

if not self.hwm:

517

if not self.hwm:

515

return range(len(self.targets))

518

return range(len(self.targets))

516

available = []

519

available = []

517

for idx in range(len(self.targets)):

520

for idx in range(len(self.targets)):

518

if self.loads[idx] < self.hwm:

521

if self.loads[idx] < self.hwm:

519

available.append(idx)

522

available.append(idx)

520

return available

523

return available

521

524

522

def maybe_run(self, job):
    """Check location dependencies, and run the job if they are met.

    Returns True when the job was handed to ``submit_task``, False when it
    could not be placed on any engine right now.  When placement is found
    to be impossible (``follow`` requires several different destinations,
    or no eligible target remains), the job is failed through
    ``fail_unreachable`` before returning False.
    """
    msg_id = job.msg_id
    self.log.debug("Attempting to assign task %s", msg_id)
    available = self.available_engines()
    if not available:
        # no engines, definitely can't run
        return False

    if job.follow or job.targets or job.blacklist or self.hwm:
        # we need a can_run filter
        def can_run(idx):
            # check hwm
            if self.hwm and self.loads[idx] == self.hwm:
                return False
            target = self.targets[idx]
            # check blacklist
            if target in job.blacklist:
                return False
            # check targets
            if job.targets and target not in job.targets:
                return False
            # check follow
            return job.follow.check(self.completed[target], self.failed[target])

        # Build a real list: on Python 3 filter() yields an iterator, which
        # is always truthy and cannot be indexed by submit_task().
        indices = [idx for idx in available if can_run(idx)]

        if not indices:
            # couldn't run
            if job.follow.all:
                # check follow for impossibility
                dests = set()
                relevant = set()
                if job.follow.success:
                    relevant = self.all_completed
                if job.follow.failure:
                    relevant = relevant.union(self.all_failed)
                for m in job.follow.intersection(relevant):
                    dests.add(self.destinations[m])
                if len(dests) > 1:
                    # fail_unreachable() only acts on jobs in queue_map
                    self.queue_map[msg_id] = job
                    self.fail_unreachable(msg_id)
                    return False
            if job.targets:
                # check blacklist+targets for impossibility
                job.targets.difference_update(job.blacklist)
                if not job.targets or not job.targets.intersection(self.targets):
                    self.queue_map[msg_id] = job
                    self.fail_unreachable(msg_id)
                    return False
            return False
    else:
        indices = None

    self.submit_task(job, indices)
    return True

578

581

579

def save_unmet(self, job):

582

def save_unmet(self, job):

580

"""Save a message for later submission when its dependencies are met."""

583

"""Save a message for later submission when its dependencies are met."""

581

msg_id = job.msg_id

584

msg_id = job.msg_id

582

self.log.debug("Adding task %s to the queue", msg_id)

585

self.log.debug("Adding task %s to the queue", msg_id)

583

self.queue_map[msg_id] = job

586

self.queue_map[msg_id] = job

584

~~heapq~~.~~heappush~~(self.queue, job)

587

self.queue.append(job)

585

# track the ids in follow or after, but not those already finished

588

# track the ids in follow or after, but not those already finished

586

for dep_id in job.after.union(job.follow).difference(self.all_done):

589

for dep_id in job.after.union(job.follow).difference(self.all_done):

587

if dep_id not in self.graph:

590

if dep_id not in self.graph:

588

self.graph[dep_id] = set()

591

self.graph[dep_id] = set()

589

self.graph[dep_id].add(msg_id)

592

self.graph[dep_id].add(msg_id)

590

593

591

def submit_task(self, job, indices=None):

594

def submit_task(self, job, indices=None):

592

"""Submit a task to any of a subset of our targets."""

595

"""Submit a task to any of a subset of our targets."""

593

if indices:

596

if indices:

594

loads = [self.loads[i] for i in indices]

597

loads = [self.loads[i] for i in indices]

595

else:

598

else:

596

loads = self.loads

599

loads = self.loads

597

idx = self.scheme(loads)

600

idx = self.scheme(loads)

598

if indices:

601

if indices:

599

idx = indices[idx]

602

idx = indices[idx]

600

target = self.targets[idx]

603

target = self.targets[idx]

601

# print (target, map(str, msg[:3]))

604

# print (target, map(str, msg[:3]))

602

# send job to the engine

605

# send job to the engine

603

self.engine_stream.send(target, flags=zmq.SNDMORE, copy=False)

606

self.engine_stream.send(target, flags=zmq.SNDMORE, copy=False)

604

self.engine_stream.send_multipart(job.raw_msg, copy=False)

607

self.engine_stream.send_multipart(job.raw_msg, copy=False)

605

# update load

608

# update load

606

self.add_job(idx)

609

self.add_job(idx)

607

self.pending[target][job.msg_id] = job

610

self.pending[target][job.msg_id] = job

608

# notify Hub

611

# notify Hub

609

content = dict(msg_id=job.msg_id, engine_id=target.decode('ascii'))

612

content = dict(msg_id=job.msg_id, engine_id=target.decode('ascii'))

610

self.session.send(self.mon_stream, 'task_destination', content=content,

613

self.session.send(self.mon_stream, 'task_destination', content=content,

611

ident=[b'tracktask',self.ident])

614

ident=[b'tracktask',self.ident])

612

615

613

616

614

#-----------------------------------------------------------------------

617

#-----------------------------------------------------------------------

615

# Result Handling

618

# Result Handling

616

#-----------------------------------------------------------------------

619

#-----------------------------------------------------------------------

617

620

618

621

619

@util.log_errors

622

@util.log_errors

620

def dispatch_result(self, raw_msg):

623

def dispatch_result(self, raw_msg):

621

"""dispatch method for result replies"""

624

"""dispatch method for result replies"""

622

try:

625

try:

623

idents,msg = self.session.feed_identities(raw_msg, copy=False)

626

idents,msg = self.session.feed_identities(raw_msg, copy=False)

624

msg = self.session.unserialize(msg, content=False, copy=False)

627

msg = self.session.unserialize(msg, content=False, copy=False)

625

engine = idents[0]

628

engine = idents[0]

626

try:

629

try:

627

idx = self.targets.index(engine)

630

idx = self.targets.index(engine)

628

except ValueError:

631

except ValueError:

629

pass # skip load-update for dead engines

632

pass # skip load-update for dead engines

630

else:

633

else:

631

self.finish_job(idx)

634

self.finish_job(idx)

632

except Exception:

635

except Exception:

633

self.log.error("task::Invaid result: %r", raw_msg, exc_info=True)

636

self.log.error("task::Invaid result: %r", raw_msg, exc_info=True)

634

return

637

return

635

638

636

md = msg['metadata']

639

md = msg['metadata']

637

parent = msg['parent_header']

640

parent = msg['parent_header']

638

if md.get('dependencies_met', True):

641

if md.get('dependencies_met', True):

639

success = (md['status'] == 'ok')

642

success = (md['status'] == 'ok')

640

msg_id = parent['msg_id']

643

msg_id = parent['msg_id']

641

retries = self.retries[msg_id]

644

retries = self.retries[msg_id]

642

if not success and retries > 0:

645

if not success and retries > 0:

643

# failed

646

# failed

644

self.retries[msg_id] = retries - 1

647

self.retries[msg_id] = retries - 1

645

self.handle_unmet_dependency(idents, parent)

648

self.handle_unmet_dependency(idents, parent)

646

else:

649

else:

647

del self.retries[msg_id]

650

del self.retries[msg_id]

648

# relay to client and update graph

651

# relay to client and update graph

649

self.handle_result(idents, parent, raw_msg, success)

652

self.handle_result(idents, parent, raw_msg, success)

650

# send to Hub monitor

653

# send to Hub monitor

651

self.mon_stream.send_multipart([b'outtask']+raw_msg, copy=False)

654

self.mon_stream.send_multipart([b'outtask']+raw_msg, copy=False)

652

else:

655

else:

653

self.handle_unmet_dependency(idents, parent)

656

self.handle_unmet_dependency(idents, parent)

654

657

655

def handle_result(self, idents, parent, raw_msg, success=True):

658

def handle_result(self, idents, parent, raw_msg, success=True):

656

"""handle a real task result, either success or failure"""

659

"""handle a real task result, either success or failure"""

657

# first, relay result to client

660

# first, relay result to client

658

engine = idents[0]

661

engine = idents[0]

659

client = idents[1]

662

client = idents[1]

660

# swap_ids for ROUTER-ROUTER mirror

663

# swap_ids for ROUTER-ROUTER mirror

661

raw_msg[:2] = [client,engine]

664

raw_msg[:2] = [client,engine]

662

# print (map(str, raw_msg[:4]))

665

# print (map(str, raw_msg[:4]))

663

self.client_stream.send_multipart(raw_msg, copy=False)

666

self.client_stream.send_multipart(raw_msg, copy=False)

664

# now, update our data structures

667

# now, update our data structures

665

msg_id = parent['msg_id']

668

msg_id = parent['msg_id']

666

self.pending[engine].pop(msg_id)

669

self.pending[engine].pop(msg_id)

667

if success:

670

if success:

668

self.completed[engine].add(msg_id)

671

self.completed[engine].add(msg_id)

669

self.all_completed.add(msg_id)

672

self.all_completed.add(msg_id)

670

else:

673

else:

671

self.failed[engine].add(msg_id)

674

self.failed[engine].add(msg_id)

672

self.all_failed.add(msg_id)

675

self.all_failed.add(msg_id)

673

self.all_done.add(msg_id)

676

self.all_done.add(msg_id)

674

self.destinations[msg_id] = engine

677

self.destinations[msg_id] = engine

675

678

676

self.update_graph(msg_id, success)

679

self.update_graph(msg_id, success)

677

680

678

def handle_unmet_dependency(self, idents, parent):

681

def handle_unmet_dependency(self, idents, parent):

679

"""handle an unmet dependency"""

682

"""handle an unmet dependency"""

680

engine = idents[0]

683

engine = idents[0]

681

msg_id = parent['msg_id']

684

msg_id = parent['msg_id']

682

685

683

job = self.pending[engine].pop(msg_id)

686

job = self.pending[engine].pop(msg_id)

684

job.blacklist.add(engine)

687

job.blacklist.add(engine)

685

688

686

if job.blacklist == job.targets:

689

if job.blacklist == job.targets:

687

self.queue_map[msg_id] = job

690

self.queue_map[msg_id] = job

688

self.fail_unreachable(msg_id)

691

self.fail_unreachable(msg_id)

689

elif not self.maybe_run(job):

692

elif not self.maybe_run(job):

690

# resubmit failed

693

# resubmit failed

691

if msg_id not in self.all_failed:

694

if msg_id not in self.all_failed:

692

# put it back in our dependency tree

695

# put it back in our dependency tree

693

self.save_unmet(job)

696

self.save_unmet(job)

694

697

695

if self.hwm:

698

if self.hwm:

696

try:

699

try:

697

idx = self.targets.index(engine)

700

idx = self.targets.index(engine)

698

except ValueError:

701

except ValueError:

699

pass # skip load-update for dead engines

702

pass # skip load-update for dead engines

700

else:

703

else:

701

if self.loads[idx] == self.hwm-1:

704

if self.loads[idx] == self.hwm-1:

702

self.update_graph(None)

705

self.update_graph(None)

703

706

704

def update_graph(self, dep_id=None, success=True):
    """dep_id just finished. Update our dependency
    graph and submit any jobs that just became runnable.

    Called with dep_id=None to update entire graph for hwm, but without finishing a task.

    Jobs that were taken off ``self.queue`` but neither ran nor failed are
    put back at the front of the queue in their original relative order.
    """
    # update any jobs that depended on the dependency
    msg_ids = self.graph.pop(dep_id, [])

    # recheck *all* jobs if
    # a) we have HWM and an engine just become no longer full
    # or b) dep_id was given as None

    if dep_id is None or self.hwm and any( [ load==self.hwm-1 for load in self.loads ]):
        jobs = self.queue
        using_queue = True
    else:
        using_queue = False
        jobs = deque(sorted( self.queue_map[msg_id] for msg_id in msg_ids ))

    to_restore = []
    while jobs:
        job = jobs.popleft()
        if job.removed:
            # lazily-deleted entry, drop it
            continue
        msg_id = job.msg_id

        put_it_back = True

        if job.after.unreachable(self.all_completed, self.all_failed)\
                or job.follow.unreachable(self.all_completed, self.all_failed):
            self.fail_unreachable(msg_id)
            put_it_back = False

        elif job.after.check(self.all_completed, self.all_failed): # time deps met, maybe run
            if self.maybe_run(job):
                put_it_back = False
                self.queue_map.pop(msg_id)
                # NOTE(review): a job started from the msg_ids path (not
                # using_queue) is not flagged `removed`, yet may still sit
                # in self.queue -- confirm a later full scan cannot pick it
                # up again.
                for mid in job.dependents:
                    if mid in self.graph:
                        self.graph[mid].remove(msg_id)

                # abort the loop if we just filled up all of our engines.
                # avoids an O(N) operation in situation of full queue,
                # where graph update is triggered as soon as an engine becomes
                # non-full, and all tasks after the first are checked,
                # even though they can't run.
                if not self.available_engines():
                    break

        if using_queue and put_it_back:
            # popped a job from the queue but it neither ran nor failed,
            # so we need to put it back when we are done
            # make sure to_restore preserves the same ordering
            to_restore.append(job)

    # put back any tasks we popped but didn't run
    if using_queue:
        # extendleft() inserts items one at a time at the left end, which
        # reverses them; feed it the reversed list to keep FIFO order.
        self.queue.extendleft(reversed(to_restore))

769

773

770

771

#----------------------------------------------------------------------

774

#----------------------------------------------------------------------

772

# methods to be overridden by subclasses

775

# methods to be overridden by subclasses

773

#----------------------------------------------------------------------

776

#----------------------------------------------------------------------

774

777

775

def add_job(self, idx):

778

def add_job(self, idx):

776

"""Called after self.targets[idx] just got the job with header.

779

"""Called after self.targets[idx] just got the job with header.

777

Override with subclasses. The default ordering is simple LRU.

780

Override with subclasses. The default ordering is simple LRU.

778

The default loads are the number of outstanding jobs."""

781

The default loads are the number of outstanding jobs."""

779

self.loads[idx] += 1

782

self.loads[idx] += 1

780

for lis in (self.targets, self.loads):

783

for lis in (self.targets, self.loads):

781

lis.append(lis.pop(idx))

784

lis.append(lis.pop(idx))

782

785

783

786

784

def finish_job(self, idx):

787

def finish_job(self, idx):

785

"""Called after self.targets[idx] just finished a job.

788

"""Called after self.targets[idx] just finished a job.

786

Override with subclasses."""

789

Override with subclasses."""

787

self.loads[idx] -= 1

790

self.loads[idx] -= 1

788

791

789

792

790

793

791

def launch_scheduler(in_addr, out_addr, mon_addr, not_addr, reg_addr, config=None,
                        logname='root', log_url=None, loglevel=logging.DEBUG,
                        identity=b'task', in_thread=False):
    """Create the sockets and logger for a TaskScheduler and start it.

    Parameters
    ----------
    in_addr, out_addr : addresses the two ROUTER sockets are bound to; they
        become the scheduler's client_stream and engine_stream.
    mon_addr : address the PUB monitor socket connects to.
    not_addr : address the SUB notification socket connects to.
    reg_addr : address the DEALER query socket connects to.
    config : optional dict, wrapped back into a Config when non-empty.
    logname, log_url, loglevel : logging setup, used only when not running
        in a thread; with log_url the logger is built by connect_logger,
        otherwise by local_logger.
    identity : prefix for the ROUTER socket identities ('_in' / '_out' are
        appended).
    in_thread : when true, share the process-wide zmq Context, IOLoop and
        Application logger and return after starting the scheduler; when
        false, create private ones and run the loop until interrupted.
    """
    ZMQStream = zmqstream.ZMQStream
    # loglevel is deliberately not reassigned here, so that the value the
    # caller passed reaches connect_logger / local_logger below.
    if config:
        # unwrap dict back into Config
        config = Config(config)

    if in_thread:
        # use instance() to get the same Context/Loop as our parent
        ctx = zmq.Context.instance()
        loop = ioloop.IOLoop.instance()
    else:
        # in a process, don't use instance()
        # for safety with multiprocessing
        ctx = zmq.Context()
        loop = ioloop.IOLoop()
    ins = ZMQStream(ctx.socket(zmq.ROUTER),loop)
    ins.setsockopt(zmq.IDENTITY, identity + b'_in')
    ins.bind(in_addr)

    outs = ZMQStream(ctx.socket(zmq.ROUTER),loop)
    outs.setsockopt(zmq.IDENTITY, identity + b'_out')
    outs.bind(out_addr)
    mons = zmqstream.ZMQStream(ctx.socket(zmq.PUB),loop)
    mons.connect(mon_addr)
    nots = zmqstream.ZMQStream(ctx.socket(zmq.SUB),loop)
    nots.setsockopt(zmq.SUBSCRIBE, b'')
    nots.connect(not_addr)

    querys = ZMQStream(ctx.socket(zmq.DEALER),loop)
    querys.connect(reg_addr)

    # setup logging.
    if in_thread:
        log = Application.instance().log
    else:
        if log_url:
            log = connect_logger(logname, ctx, log_url, root="scheduler", loglevel=loglevel)
        else:
            log = local_logger(logname, loglevel)

    scheduler = TaskScheduler(client_stream=ins, engine_stream=outs,
                            mon_stream=mons, notifier_stream=nots,
                            query_stream=querys,
                            loop=loop, log=log,
                            config=config)
    scheduler.start()
    if not in_thread:
        try:
            loop.start()
        except KeyboardInterrupt:
            scheduler.log.critical("Interrupted, exiting...")

846

849

	Site-wide shortcuts
/	Use quick search box
g h	Goto home page
g g	Goto my private gists page
g G	Goto my public gists page
g 0-9	Goto bookmarked items from 0-9
n r	New repository page
n g	New gist page

	Repositories
g s	Goto summary page
g c	Goto changelog page
g f	Goto files page
g F	Goto files page with file search activated
g p	Goto pull requests page
g o	Goto repository settings
g O	Goto repository access permissions settings
t s	Toggle sidebar on some pages

             """The Python scheduler for rich scheduling.
             The Pure ZMQ scheduler does not allow routing schemes other than LRU,
             nor does it check msg_id DAG dependencies. For those, a slightly slower
             Python Scheduler exists.
             Authors:
             * Min RK
             """
             #-----------------------------------------------------------------------------
             #  Copyright (C) 2010-2011  The IPython Development Team
             #
             #  Distributed under the terms of the BSD License.  The full license is in
             #  the file COPYING, distributed as part of this software.
             #-----------------------------------------------------------------------------
             #----------------------------------------------------------------------
             # Imports
             #----------------------------------------------------------------------
-            import heapq
             import logging
             import sys
             import time
-            from datetime import datetime, timedelta
+            from collections import deque
+            from datetime import datetime
             from random import randint, random
             from types import FunctionType
             try:
                 import numpy
             except ImportError:
                 numpy = None
             import zmq
             from zmq.eventloop import ioloop, zmqstream
             # local imports
             from IPython.external.decorator import decorator
             from IPython.config.application import Application
             from IPython.config.loader import Config
             from IPython.utils.traitlets import Instance, Dict, List, Set, Integer, Enum, CBytes
             from IPython.utils.py3compat import cast_bytes
             from IPython.parallel import error, util
             from IPython.parallel.factory import SessionFactory
             from IPython.parallel.util import connect_logger, local_logger
             from .dependency import Dependency
             @decorator
             def logged(f,self,*args,**kwargs):
                 """Log a debug line naming the wrapped method and its arguments, then call it.

                 The message goes to ``self.log``; the wrapped function's return
                 value is passed through unchanged.
                 """
                 # __name__ is available on both Python 2 and 3, whereas
                 # func_name only exists on Python 2 function objects.
                 self.log.debug("scheduler::%s(*%s,**%s)", f.__name__, args, kwargs)
                 return f(self,*args, **kwargs)
             #----------------------------------------------------------------------
             # Chooser functions
             #----------------------------------------------------------------------
             def plainrandom(loads):
                 """Choose an index into `loads` uniformly at random.

                 Only the number of entries matters; the load values
                 themselves are never looked at.
                 """
                 last = len(loads) - 1
                 return randint(0, last)
             def lru(loads):
                 """Select whichever entry is first in line.

                 `loads` is expected to be kept in LRU order (oldest first),
                 so the answer is always index 0; the values are ignored.
                 """
                 head = 0
                 return head
             def twobin(loads):
                 """Draw two random indices and keep the smaller one.

                 With `loads` in LRU order (oldest first) the smaller index is
                 the less recently used of the two candidates.  The load values
                 themselves are ignored.
                 """
                 upper = len(loads) - 1
                 first = randint(0, upper)
                 second = randint(0, upper)
                 return first if first <= second else second
             def weighted(loads):
                 """Sample two engines with probability proportional to inverse load.

                 Of the two candidates, the index with the larger weight (that
                 is, the smaller load) is returned; on a tie the first draw wins.
                 """
                 # weight 0 a million times more than 1:
                 weights = 1./(1e-6+numpy.array(loads))
                 cumulative = weights.cumsum()
                 total = cumulative[-1]
                 first_draw = random()*total
                 second_draw = random()*total
                 # first position whose running sum is >= the drawn value
                 idx = int(numpy.searchsorted(cumulative, first_draw, side='left'))
                 idy = int(numpy.searchsorted(cumulative, second_draw, side='left'))
                 return idy if weights[idy] > weights[idx] else idx
             def leastload(loads):
                 """Return the index of the smallest load.

                 Ties are broken in favour of the earliest position, so when
                 `loads` is in LRU order the least recently used of the
                 least-loaded engines is selected.
                 """
                 lightest = min(loads)
                 return loads.index(lightest)
             #---------------------------------------------------------------------
             # Classes
             #---------------------------------------------------------------------
             # store empty default dependency:
             MET = Dependency([])
             class Job(object):
                 """Simple container for a job.

                 Holds the submission message in its various forms together with
                 its scheduling constraints.  Jobs order by creation time
                 (``timestamp``), so sorting a collection of jobs gives
                 first-submitted-first.
                 """
                 def __init__(self, msg_id, raw_msg, idents, msg, header, metadata,
                                 targets, after, follow, timeout):
                     self.msg_id = msg_id
                     self.raw_msg = raw_msg
                     self.idents = idents
                     self.msg = msg
                     self.header = header
                     self.metadata = metadata
                     self.targets = targets
                     self.after = after
                     self.follow = follow
                     self.timeout = timeout

                     self.removed = False # used for lazy-delete from sorted queue
                     self.timestamp = time.time()
                     # starts empty; filled in elsewhere with engines to avoid
                     self.blacklist = set()

                 def __lt__(self, other):
                     return self.timestamp < other.timestamp

                 def __cmp__(self, other):
                     # Same -1/0/1 result as cmp(), but without relying on the
                     # cmp builtin, which only exists on Python 2.
                     mine, theirs = self.timestamp, other.timestamp
                     return (mine > theirs) - (mine < theirs)

                 @property
                 def dependents(self):
                     """Union of the ids in ``follow`` and ``after``."""
                     return self.follow.union(self.after)
             class TaskScheduler(SessionFactory):
                 """Python TaskScheduler object.
                 This is the simplest object that supports msg_id based
                 DAG dependencies. *Only* task msg_ids are checked, not
                 msg_ids of jobs submitted via the MUX queue.
                 """
                 # per-engine cap on outstanding tasks; a falsy value (0) disables
                 # the cap (see available_engines)
                 hwm = Integer(1, config=True,
                     help="""specify the High Water Mark (HWM) for the downstream
                     socket in the Task scheduler. This is the maximum number
                     of allowed outstanding tasks on each engine.
                     The default (1) means that only one task can be outstanding on each
                     engine.  Setting TaskScheduler.hwm=0 means there is no limit, and the
                     engines continue to be assigned tasks while they are working,
                     effectively hiding network latency behind computation, but can result
                     in an imbalance of work when submitting many heterogenous tasks all at
                     once.  Any positive value greater than one is a compromise between the
                     two.
                     """
                 )
                 # name of the scheduling scheme; _scheme_name_changed looks the
                 # name up in this module's globals and stores the result in `scheme`
                 scheme_name = Enum(('leastload', 'pure', 'lru', 'plainrandom', 'weighted', 'twobin'),
                     'leastload', config=True, allow_none=False,
                     help="""select the task scheduler scheme  [default: Python LRU]
                     Options are: 'pure', 'lru', 'plainrandom', 'weighted', 'twobin','leastload'"""
                 )
                 def _scheme_name_changed(self, old, new):
                     """React to a new `scheme_name`: log it and rebind `scheme`.

                     The scheme function is looked up by name in this module's
                     globals; `old` is not used.
                     """
                     message = "Using scheme %r"%new
                     self.log.debug(message)
                     scheme_fn = globals()[new]
                     self.scheme = scheme_fn
                 # input arguments:
                 # `scheme` is called with a list of loads and returns an index into
                 # that list (see submit_task)
                 scheme = Instance(FunctionType) # function for determining the destination
                 def _scheme_default(self):
                     """Default value for `scheme`: the module-level `leastload`."""
                     return leastload
                 # ZMQ streams used by the scheduler; `start` installs receive
                 # callbacks on all of them except mon_stream, which is only sent to
                 client_stream = Instance(zmqstream.ZMQStream) # client-facing stream
                 engine_stream = Instance(zmqstream.ZMQStream) # engine-facing stream
                 notifier_stream = Instance(zmqstream.ZMQStream) # hub-facing sub stream
                 mon_stream = Instance(zmqstream.ZMQStream) # hub-facing pub stream
                 query_stream = Instance(zmqstream.ZMQStream) # hub-facing DEALER stream
                 # internals:
                 # waiting Jobs in submission order; a deque because jobs are
                 # appended at the back and popped from the front
                 queue = Instance(deque) # sorted list of Jobs
                 def _queue_default(self):
                     """Default value for `queue`: a new, empty deque."""
                     return deque()
                 queue_map = Dict() # dict by msg_id of Jobs (for O(1) access to the Queue)
                 graph = Dict() # dict by msg_id of [ msg_ids that depend on key ]
                 retries = Dict() # dict by msg_id of retries remaining (non-neg ints)
                 # waiting = List() # list of msg_ids ready to run, but haven't due to HWM
                 pending = Dict() # dict by engine_uuid of submitted tasks
                 completed = Dict() # dict by engine_uuid of completed tasks
                 failed = Dict() # dict by engine_uuid of failed tasks
                 destinations = Dict() # dict by msg_id of engine_uuids where jobs ran (reverse of completed+failed)
                 clients = Dict() # dict by msg_id for who submitted the task
                 # targets and loads are parallel lists: loads[i] is the load of
                 # targets[i]; they are always inserted, popped and rotated together
                 targets = List() # list of target IDENTs
                 loads = List() # list of engine loads
                 # full = Set() # set of IDENTs that have HWM outstanding tasks
                 all_completed = Set() # set of all completed tasks
                 all_failed = Set() # set of all failed tasks
                 all_done = Set() # set of all finished tasks=union(completed,failed)
                 all_ids = Set() # set of all submitted task IDs
                 ident = CBytes() # ZMQ identity. This should just be self.session.session
                                  # but ensure Bytes
                 def _ident_default(self):
                     """Default value for `ident`: the session's `bsession`."""
                     return self.session.bsession
                 def start(self):
                     """Install all stream callbacks and send the initial connection request."""
                     # hub query channel: install the reply handler, then ask
                     query = self.query_stream
                     query.on_recv(self.dispatch_query_reply)
                     self.session.send(query, "connection_request", {})
                     # task traffic: results from engines, submissions from clients
                     self.engine_stream.on_recv(self.dispatch_result, copy=False)
                     self.client_stream.on_recv(self.dispatch_submission, copy=False)
                     # engine (un)registration notices, dispatched by msg_type
                     self._notification_handlers = {
                         'registration_notification': self._register_engine,
                         'unregistration_notification': self._unregister_engine,
                     }
                     self.notifier_stream.on_recv(self.dispatch_notification)
                     self.log.info("Scheduler started [%s]" % self.scheme_name)
                 def resume_receiving(self):
                     """Resume accepting jobs.

                     Re-installs dispatch_submission as the receive callback of the
                     client stream, exactly as `start` does.
                     """
                     self.client_stream.on_recv(self.dispatch_submission, copy=False)
                 def stop_receiving(self):
                     """Stop accepting jobs while there are no engines.
                     Leave them in the ZMQ queue."""
                     # passing None as the callback detaches the current handler
                     self.client_stream.on_recv(None)
                 #-----------------------------------------------------------------------
                 # [Un]Registration Handling
                 #-----------------------------------------------------------------------
                 def dispatch_query_reply(self, msg):
                     """Handle the reply to the connection request sent by `start`.

                     Every engine uuid listed under the reply's 'engines' content
                     key is registered with this scheduler.
                     """
                     try:
                         idents, frames = self.session.feed_identities(msg)
                     except ValueError:
                         self.log.warn("task::Invalid Message: %r",msg)
                         return
                     try:
                         reply = self.session.unserialize(frames)
                     except ValueError:
                         self.log.warn("task::Unauthorized message from: %r"%idents)
                         return
                     known_engines = reply['content'].get('engines', {})
                     for engine_uuid in known_engines.values():
                         self._register_engine(cast_bytes(engine_uuid))
                 @util.log_errors
                 def dispatch_notification(self, msg):
                     """Route a register/unregister notice to its handler.

                     The handler is chosen by the header's msg_type and called with
                     the engine uuid from the message content.  Malformed messages,
                     unknown types and handler errors are logged, not raised.
                     """
                     try:
                         idents, frames = self.session.feed_identities(msg)
                     except ValueError:
                         self.log.warn("task::Invalid Message: %r",msg)
                         return
                     try:
                         notice = self.session.unserialize(frames)
                     except ValueError:
                         self.log.warn("task::Unauthorized message from: %r"%idents)
                         return
                     msg_type = notice['header']['msg_type']
                     handler = self._notification_handlers.get(msg_type)
                     if handler is None:
                         self.log.error("Unhandled message type: %r"%msg_type)
                         return
                     try:
                         handler(cast_bytes(notice['content']['uuid']))
                     except Exception:
                         self.log.error("task::Invalid notification msg: %r", notice, exc_info=True)
                 def _register_engine(self, uid):
                     """Start tracking the engine with ident `uid`, then rescan queued jobs."""
                     # a new engine goes to the front of both parallel lists,
                     # with a load of zero
                     self.targets.insert(0, uid)
                     self.loads.insert(0, 0)
                     # fresh, empty bookkeeping for this engine
                     for finished in (self.completed, self.failed):
                         finished[uid] = set()
                     self.pending[uid] = dict()
                     # re-examine every waiting job now that capacity was added
                     self.update_graph(None)
                 def _unregister_engine(self, uid):
                     """Stop routing work to the engine with ident `uid`.

                     The engine leaves the target/load lists immediately.  If it
                     still has pending tasks, their cleanup is deferred by five
                     seconds; otherwise its completed/failed records are dropped
                     right away.  Losing the last engine gets no special handling.
                     """
                     # process any results that already arrived from the engine
                     self.engine_stream.flush()
                     # destinations is deliberately left alone: entries may still be
                     # consulted later
                     # take the engine out of rotation
                     position = self.targets.index(uid)
                     del self.targets[position]
                     del self.loads[position]
                     if not self.pending[uid]:
                         self.completed.pop(uid)
                         self.failed.pop(uid)
                         return
                     # results might still be incoming, so wait 5 seconds before
                     # declaring the remaining tasks stranded
                     def cleanup():
                         return self.handle_stranded_tasks(uid)
                     delayed = ioloop.DelayedCallback(cleanup, 5000, self.loop)
                     delayed.start()
                 def handle_stranded_tasks(self, engine):
                     """Deal with jobs resident in an engine that died.

                     For each task still pending on `engine`, a fake 'apply_reply'
                     carrying an EngineError is built and passed to dispatch_result.
                     Afterwards the engine's completed/failed records are dropped.
                     """
                     lost = self.pending[engine]
                     # iterate over a snapshot of the keys: dispatch_result() removes
                     # entries from this dict while we are looping
                     for msg_id in list(lost):
                         if msg_id not in self.pending[engine]:
                             # prevent double-handling of messages
                             continue
                         raw_msg = lost[msg_id].raw_msg
                         idents,msg = self.session.feed_identities(raw_msg, copy=False)
                         parent = self.session.unpack(msg[1].bytes)
                         idents = [engine, idents[0]]
                         # build fake error reply
                         try:
                             raise error.EngineError("Engine %r died while running task %r"%(engine, msg_id))
                         except Exception:
                             content = error.wrap_exception()
                         # build fake metadata
                         md = dict(
                             status=u'error',
                             engine=engine,
                             date=datetime.now(),
                         )
                         msg = self.session.msg('apply_reply', content, parent=parent, metadata=md)
                         # a real list, because handle_result() slice-assigns into it
                         raw_reply = [zmq.Message(part)
                                      for part in self.session.serialize(msg, ident=idents)]
                         # and dispatch it
                         self.dispatch_result(raw_reply)
                     # finally scrub completed/failed lists
                     self.completed.pop(engine)
                     self.failed.pop(engine)
                 #-----------------------------------------------------------------------
                 # Job Submission
                 #-----------------------------------------------------------------------
                 @util.log_errors
                 def dispatch_submission(self, raw_msg):
                     """Dispatch job submission to appropriate handlers.

                     Parses the task message, records its id and retry count, builds
                     the `after` (time) and `follow` (location) dependencies from the
                     metadata, and wraps everything in a Job.  The job is then either
                     failed as unreachable, run immediately, or saved until its
                     dependencies are met.
                     """
                     # ensure targets up to date:
                     self.notifier_stream.flush()
                     try:
                         idents, msg = self.session.feed_identities(raw_msg, copy=False)
                         msg = self.session.unserialize(msg, content=False, copy=False)
                     except Exception:
                         self.log.error("task::Invaid task msg: %r"%raw_msg, exc_info=True)
                         return
                     # send to monitor
                     self.mon_stream.send_multipart([b'intask']+raw_msg, copy=False)
                     header = msg['header']
                     md = msg['metadata']
                     msg_id = header['msg_id']
                     self.all_ids.add(msg_id)
                     # get targets as a set of bytes objects
                     # from a list of unicode objects
                     targets = md.get('targets', [])
                     targets = map(cast_bytes, targets)
                     targets = set(targets)
                     retries = md.get('retries', 0)
                     self.retries[msg_id] = retries
                     # time dependencies
                     after = md.get('after', None)
                     if after:
                         after = Dependency(after)
                         if after.all:
                             # for an "all" dependency, drop the ids that have already
                             # finished in an accepted way
                             if after.success:
                                 after = Dependency(after.difference(self.all_completed),
                                             success=after.success,
                                             failure=after.failure,
                                             all=after.all,
                                 )
                             if after.failure:
                                 after = Dependency(after.difference(self.all_failed),
                                             success=after.success,
                                             failure=after.failure,
                                             all=after.all,
                                 )
                         if after.check(self.all_completed, self.all_failed):
                             # recast as empty set, if `after` already met,
                             # to prevent unnecessary set comparisons
                             after = MET
                     else:
                         after = MET
                     # location dependencies
                     follow = Dependency(md.get('follow', []))
                     # turn a relative timeout into an absolute deadline
                     # (time.time() based float):
                     timeout = md.get('timeout', None)
                     if timeout:
                         timeout = time.time() + float(timeout)
                     job = Job(msg_id=msg_id, raw_msg=raw_msg, idents=idents, msg=msg,
                              header=header, targets=targets, after=after, follow=follow,
                              timeout=timeout, metadata=md,
                     )
                     if timeout:
                         # schedule timeout callback
                         self.loop.add_timeout(timeout, lambda : self.job_timeout(job))
                     # validate and reduce dependencies:
                     for dep in after,follow:
                         if not dep: # empty dependency
                             continue
                         # check valid:
                         # a job may not depend on itself or on ids never submitted
                         if msg_id in dep or dep.difference(self.all_ids):
                             # fail_unreachable() only acts on jobs found in queue_map
                             self.queue_map[msg_id] = job
                             return self.fail_unreachable(msg_id, error.InvalidDependency)
                         # check if unreachable:
                         if dep.unreachable(self.all_completed, self.all_failed):
                             self.queue_map[msg_id] = job
                             return self.fail_unreachable(msg_id)
                     if after.check(self.all_completed, self.all_failed):
                         # time deps already met, try to run
                         if not self.maybe_run(job):
                             # can't run yet
                             if msg_id not in self.all_failed:
                                 # could have failed as unreachable
                                 self.save_unmet(job)
                     else:
                         self.save_unmet(job)
                 def job_timeout(self, job):
                     """callback for a job's timeout.

                     The job may or may not have been run at this point.  If it is
                     still waiting in queue_map it is failed with TaskTimeout;
                     otherwise nothing is done.
                     """
                     # read the clock once so the comparison and the log agree
                     now = time.time()
                     if job.timeout >= (now + 1):
                         self.log.warn("task %s timeout fired prematurely: %s > %s",
                             job.msg_id, job.timeout, now
                         )
                     if job.msg_id in self.queue_map:
                         # still waiting, but ran out of time
                         self.log.info("task %r timed out", job.msg_id)
                         self.fail_unreachable(job.msg_id, error.TaskTimeout)
                 def fail_unreachable(self, msg_id, why=error.ImpossibleDependency):
                     """a task has become unreachable, send a reply with an ImpossibleDependency
                     error.

                     `why` is the exception class to report (ImpossibleDependency by
                     default).  The job must be present in queue_map; otherwise an
                     error is logged and nothing else happens.
                     """
                     if msg_id not in self.queue_map:
                         self.log.error("task %r already failed!", msg_id)
                         return
                     job = self.queue_map.pop(msg_id)
                     # lazy-delete from the queue
                     job.removed = True
                     for mid in job.dependents:
                         if mid in self.graph:
                             # discard, not remove: the job can fail before
                             # save_unmet() ever recorded it under this dependency
                             self.graph[mid].discard(msg_id)
                     # raise and catch so that wrap_exception() is called while the
                     # exception is being handled
                     try:
                         raise why()
                     except Exception:
                         content = error.wrap_exception()
                     self.log.debug("task %r failing as unreachable with: %s", msg_id, content['ename'])
                     self.all_done.add(msg_id)
                     self.all_failed.add(msg_id)
                     # reply to the client, then mirror the reply to the monitor
                     msg = self.session.send(self.client_stream, 'apply_reply', content,
                                                             parent=job.header, ident=job.idents)
                     self.session.send(self.mon_stream, msg, ident=[b'outtask']+job.idents)
                     # jobs depending on this one may now be unreachable as well
                     self.update_graph(msg_id, success=False)
                 def available_engines(self):
                     """Return the indices of engines whose load is below the HWM.

                     Without a HWM (hwm is falsy) every engine index is returned.
                     """
                     engine_count = len(self.targets)
                     if not self.hwm:
                         return range(engine_count)
                     return [idx for idx in range(engine_count)
                             if self.loads[idx] < self.hwm]
                 def maybe_run(self, job):
                     """check location dependencies, and run if they are met.

                     Returns True when the job was submitted to an engine and False
                     otherwise.  On a False return the job may additionally have been
                     failed as unreachable, in which case its id is in all_failed.
                     """
                     msg_id = job.msg_id
                     self.log.debug("Attempting to assign task %s", msg_id)
                     available = self.available_engines()
                     if not available:
                         # no engines, definitely can't run
                         return False
                     if job.follow or job.targets or job.blacklist or self.hwm:
                         # we need a can_run filter
                         def can_run(idx):
                             # check hwm
                             if self.hwm and self.loads[idx] == self.hwm:
                                 return False
                             target = self.targets[idx]
                             # check blacklist
                             if target in job.blacklist:
                                 return False
                             # check targets
                             if job.targets and target not in job.targets:
                                 return False
                             # check follow
                             return job.follow.check(self.completed[target], self.failed[target])
                         # build a real list: it is truth-tested right below and
                         # indexed by submit_task(), neither of which works on a
                         # lazy filter object
                         indices = [idx for idx in available if can_run(idx)]
                         if not indices:
                             # couldn't run
                             if job.follow.all:
                                 # check follow for impossibility
                                 dests = set()
                                 relevant = set()
                                 if job.follow.success:
                                     relevant = self.all_completed
                                 if job.follow.failure:
                                     relevant = relevant.union(self.all_failed)
                                 for m in job.follow.intersection(relevant):
                                     dests.add(self.destinations[m])
                                 if len(dests) > 1:
                                     # the followed tasks ran on more than one
                                     # engine, so no single engine can satisfy all
                                     self.queue_map[msg_id] = job
                                     self.fail_unreachable(msg_id)
                                     return False
                             if job.targets:
                                 # check blacklist+targets for impossibility
                                 job.targets.difference_update(job.blacklist)
                                 if not job.targets or not job.targets.intersection(self.targets):
                                     self.queue_map[msg_id] = job
                                     self.fail_unreachable(msg_id)
                                     return False
                             return False
                     else:
                         # no restrictions: let submit_task choose among all engines
                         indices = None
                     self.submit_task(job, indices)
                     return True
                 def save_unmet(self, job):
                     """Save a message for later submission when its dependencies are met."""
                     msg_id = job.msg_id
                     self.log.debug("Adding task %s to the queue", msg_id)
                     self.queue_map[msg_id] = job
                     # newest job goes to the back of the queue
                     self.queue.append(job)
                     # track the ids in follow or after, but not those already finished
                     for dep_id in job.after.union(job.follow).difference(self.all_done):
                         self.graph.setdefault(dep_id, set()).add(msg_id)
                 def submit_task(self, job, indices=None):
                     """Send `job` to one engine, chosen by the scheme.

                     When `indices` is non-empty only those engine indices are
                     candidates; otherwise every engine is.
                     """
                     restricted = bool(indices)
                     if restricted:
                         candidate_loads = [self.loads[i] for i in indices]
                     else:
                         candidate_loads = self.loads
                     choice = self.scheme(candidate_loads)
                     # map the scheme's answer back to a position in self.targets
                     idx = indices[choice] if restricted else choice
                     target = self.targets[idx]
                     # send job to the engine: engine identity first, then the message
                     self.engine_stream.send(target, flags=zmq.SNDMORE, copy=False)
                     self.engine_stream.send_multipart(job.raw_msg, copy=False)
                     # update load
                     self.add_job(idx)
                     self.pending[target][job.msg_id] = job
                     # notify Hub
                     content = {
                         'msg_id': job.msg_id,
                         'engine_id': target.decode('ascii'),
                     }
                     self.session.send(self.mon_stream, 'task_destination', content=content,
                                     ident=[b'tracktask',self.ident])
                 #-----------------------------------------------------------------------
                 # Result Handling
                 #-----------------------------------------------------------------------
                 @util.log_errors
                 def dispatch_result(self, raw_msg):
                     """Handle a reply coming back from an engine.

                     The engine's load is reduced if it is still registered.  Then
                     the reply is treated as a real result, a retry, or an
                     unmet-dependency notice, depending on its metadata and the
                     retries left for the task.
                     """
                     try:
                         idents, frames = self.session.feed_identities(raw_msg, copy=False)
                         msg = self.session.unserialize(frames, content=False, copy=False)
                         engine = idents[0]
                         try:
                             idx = self.targets.index(engine)
                         except ValueError:
                             pass # skip load-update for dead engines
                         else:
                             self.finish_job(idx)
                     except Exception:
                         self.log.error("task::Invaid result: %r", raw_msg, exc_info=True)
                         return
                     md = msg['metadata']
                     parent = msg['parent_header']
                     if not md.get('dependencies_met', True):
                         # the engine refused the task; try somewhere else
                         self.handle_unmet_dependency(idents, parent)
                         return
                     success = (md['status'] == 'ok')
                     msg_id = parent['msg_id']
                     retries_left = self.retries[msg_id]
                     if retries_left > 0 and not success:
                         # failed, but may be retried: resubmit instead of relaying
                         self.retries[msg_id] = retries_left - 1
                         self.handle_unmet_dependency(idents, parent)
                         return
                     del self.retries[msg_id]
                     # relay to client and update graph
                     self.handle_result(idents, parent, raw_msg, success)
                     # send to Hub monitor
                     self.mon_stream.send_multipart([b'outtask']+raw_msg, copy=False)
                 def handle_result(self, idents, parent, raw_msg, success=True):
                     """Relay a finished task's reply to its client and record the outcome."""
                     engine, client = idents[0], idents[1]
                     # swap_ids for ROUTER-ROUTER mirror
                     raw_msg[:2] = [client, engine]
                     self.client_stream.send_multipart(raw_msg, copy=False)
                     # bookkeeping: the task is no longer pending on the engine
                     msg_id = parent['msg_id']
                     self.pending[engine].pop(msg_id)
                     if success:
                         per_engine, overall = self.completed, self.all_completed
                     else:
                         per_engine, overall = self.failed, self.all_failed
                     per_engine[engine].add(msg_id)
                     overall.add(msg_id)
                     self.all_done.add(msg_id)
                     self.destinations[msg_id] = engine
                     # let dependent jobs react to this outcome
                     self.update_graph(msg_id, success)
                 def handle_unmet_dependency(self, idents, parent):
                     """handle an unmet dependency

                     The task is taken back from the engine named by idents[0], that
                     engine is blacklisted for the job, and the job is then failed,
                     resubmitted elsewhere, or put back into the queue.
                     """
                     engine = idents[0]
                     msg_id = parent['msg_id']
                     job = self.pending[engine].pop(msg_id)
                     job.blacklist.add(engine)
                     if job.blacklist == job.targets:
                         # every requested target has been tried and blacklisted
                         self.queue_map[msg_id] = job
                         self.fail_unreachable(msg_id)
                     elif not self.maybe_run(job):
                         # resubmit failed
                         if msg_id not in self.all_failed:
                             # put it back in our dependency tree
                             self.save_unmet(job)
                     if self.hwm:
                         try:
                             idx = self.targets.index(engine)
                         except ValueError:
                             pass # skip load-update for dead engines
                         else:
                             # the engine is now one below the HWM, so rescan all
                             # waiting jobs
                             if self.loads[idx] == self.hwm-1:
                                 self.update_graph(None)
                 def update_graph(self, dep_id=None, success=True):
                     """dep_id just finished. Update our dependency
                     graph and submit any jobs that just became runnable.

                     Called with dep_id=None to update entire graph for hwm, but without finishing a task.

                     `success` is accepted for the callers' benefit but is not used
                     here.
                     """
                     # update any jobs that depended on the dependency
                     msg_ids = self.graph.pop(dep_id, [])
                     # recheck *all* jobs if
                     # a) we have HWM and an engine just become no longer full
                     # or b) dep_id was given as None
                     if dep_id is None or self.hwm and any(load == self.hwm-1 for load in self.loads):
                         jobs = self.queue
                         using_queue = True
                     else:
                         using_queue = False
                         # only the jobs that waited on dep_id, oldest first
                         jobs = deque(sorted(self.queue_map[msg_id] for msg_id in msg_ids))
                     to_restore = []
                     while jobs:
                         job = jobs.popleft()
                         if job.removed:
                             # lazily deleted earlier; just drop it
                             continue
                         msg_id = job.msg_id
                         put_it_back = True
                         if job.after.unreachable(self.all_completed, self.all_failed)\
                                 or job.follow.unreachable(self.all_completed, self.all_failed):
                             self.fail_unreachable(msg_id)
                             put_it_back = False
                         elif job.after.check(self.all_completed, self.all_failed): # time deps met, maybe run
                             if self.maybe_run(job):
                                 put_it_back = False
                                 # NOTE(review): when `jobs` is not self.queue, the job
                                 # submitted here stays in self.queue without being
                                 # flagged `removed` -- confirm that a later full scan
                                 # cannot pick it up again
                                 self.queue_map.pop(msg_id)
                                 for mid in job.dependents:
                                     if mid in self.graph:
                                         self.graph[mid].discard(msg_id)
                                 # abort the loop if we just filled up all of our engines.
                                 # avoids an O(N) operation in situation of full queue,
                                 # where graph update is triggered as soon as an engine becomes
                                 # non-full, and all tasks after the first are checked,
                                 # even though they can't run.
                                 if not self.available_engines():
                                     break
                         if using_queue and put_it_back:
                             # popped a job from the queue but it neither ran nor failed,
                             # so we need to put it back when we are done
                             # make sure to_restore preserves the same ordering
                             to_restore.append(job)
                     # put back any tasks we popped but didn't run
                     if using_queue:
                         # extendleft() pushes items one at a time and thereby reverses
                         # them; hand it the reversed list so the jobs return to the
                         # front of the queue in their original order
                         self.queue.extendleft(reversed(to_restore))
                 #----------------------------------------------------------------------
                 # methods to be overridden by subclasses
                 #----------------------------------------------------------------------
                 def add_job(self, idx):
                     """Record that self.targets[idx] was just handed a job.

                     Meant to be overridden by subclasses.  By default the load is
                     the number of outstanding jobs and the ordering is simple LRU:
                     the engine moves to the back of both lists.
                     """
                     self.loads[idx] += 1
                     # rotate the engine to the end of the two parallel lists
                     self.targets.append(self.targets.pop(idx))
                     self.loads.append(self.loads.pop(idx))
                 def finish_job(self, idx):
                     """Called after self.targets[idx] just finished a job.
                     Override with subclasses."""
                     # default bookkeeping: one fewer outstanding job on that engine
                     self.loads[idx] -= 1
             def launch_scheduler(in_addr, out_addr, mon_addr, not_addr, reg_addr, config=None,
                                     logname='root', log_url=None, loglevel=logging.DEBUG,
                                     identity=b'task', in_thread=False):
                 """Create the sockets for a TaskScheduler, build it, and start it.

                 Parameters
                 ----------
                 in_addr : address the ROUTER stream passed as ``client_stream`` binds to
                 out_addr : address the ROUTER stream passed as ``engine_stream`` binds to
                 mon_addr : address the PUB stream passed as ``mon_stream`` connects to
                 not_addr : address the SUB stream passed as ``notifier_stream`` connects
                     to (subscribed to every message)
                 reg_addr : address the DEALER stream passed as ``query_stream`` connects to
                 config : optional dict, re-wrapped in a Config when truthy
                 logname, log_url, loglevel : logger settings, only used when not
                     in_thread; with a log_url the logger is created by connect_logger,
                     otherwise by local_logger
                 identity : bytes prefix for the ROUTER socket identities
                     (``identity + b'_in'`` / ``identity + b'_out'``)
                 in_thread : if True, reuse the shared zmq Context / IOLoop instances and
                     the Application's logger, and do not start the loop here;
                     if False, create a private Context and IOLoop and run the loop
                     until interrupted.
                 """
                 ZMQStream = zmqstream.ZMQStream
                 # NOTE: loglevel is deliberately NOT reassigned here; an unconditional
                 # ``loglevel = logging.DEBUG`` used to discard the caller's value.

                 if config:
                     # unwrap dict back into Config
                     config = Config(config)

                 if in_thread:
                     # use instance() to get the same Context/Loop as our parent
                     ctx = zmq.Context.instance()
                     loop = ioloop.IOLoop.instance()
                 else:
                     # in a process, don't use instance()
                     # for safety with multiprocessing
                     ctx = zmq.Context()
                     loop = ioloop.IOLoop()

                 # client-facing and engine-facing ROUTER sockets
                 ins = ZMQStream(ctx.socket(zmq.ROUTER), loop)
                 ins.setsockopt(zmq.IDENTITY, identity + b'_in')
                 ins.bind(in_addr)

                 outs = ZMQStream(ctx.socket(zmq.ROUTER), loop)
                 outs.setsockopt(zmq.IDENTITY, identity + b'_out')
                 outs.bind(out_addr)

                 # monitor (PUB) and notification (SUB, all topics) sockets
                 mons = ZMQStream(ctx.socket(zmq.PUB), loop)
                 mons.connect(mon_addr)
                 nots = ZMQStream(ctx.socket(zmq.SUB), loop)
                 nots.setsockopt(zmq.SUBSCRIBE, b'')
                 nots.connect(not_addr)

                 querys = ZMQStream(ctx.socket(zmq.DEALER), loop)
                 querys.connect(reg_addr)

                 # setup logging.
                 if in_thread:
                     log = Application.instance().log
                 elif log_url:
                     log = connect_logger(logname, ctx, log_url, root="scheduler", loglevel=loglevel)
                 else:
                     log = local_logger(logname, loglevel)

                 scheduler = TaskScheduler(client_stream=ins, engine_stream=outs,
                                         mon_stream=mons, notifier_stream=nots,
                                         query_stream=querys,
                                         loop=loop, log=log,
                                         config=config)
                 scheduler.start()
                 if not in_thread:
                     # we own the loop in this case, so run it here
                     try:
                         loop.start()
                     except KeyboardInterrupt:
                         scheduler.log.critical("Interrupted, exiting...")