forked from seung-lab/python-task-queue
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathtaskqueue.py
More file actions
378 lines (301 loc) · 10.1 KB
/
taskqueue.py
File metadata and controls
378 lines (301 loc) · 10.1 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
from __future__ import print_function
import six
from functools import partial
import json
import random
import signal
import time
import traceback
import concurrent.futures
import multiprocessing as mp
import numpy as np
from tqdm import tqdm
from cloudvolume.threaded_queue import ThreadedQueue
from .aws_queue_api import AWSTaskQueueAPI
from .registered_task import RegisteredTask, deserialize
from .secrets import (
PROJECT_NAME, QUEUE_NAME, QUEUE_TYPE,
AWS_DEFAULT_REGION
)
def totask(task):
  """Deserialize a raw queue message dict into a RegisteredTask object.

  Expects the message to carry a serialized 'payload' and a queue 'id';
  the id is attached to the task so it can later be deleted/acknowledged.
  """
  obj = deserialize(task['payload'])
  obj._id = task['id']
  return obj
LEASE_SECONDS = 300
class TaskQueue(ThreadedQueue):
  """
  Client for a cloud task queue (currently AWS SQS; Google is unsupported).

  The standard usage is that a client calls lease to get the next available task,
  performs that task, and then calls task.delete on that task before the lease expires.
  If the client cannot finish the task before the lease expires,
  and has a reasonable chance of completing the task,
  it should call task.update before the lease expires.

  If the client completes the task after the lease has expired,
  it still needs to delete the task.

  Tasks should be designed to be idempotent to avoid errors
  if multiple clients complete the same task.
  """
  class QueueEmpty(LookupError):
    """Raised by lease() when no task is available."""
    def __init__(self):
      # Fixed: previously called super(LookupError, self), which skipped
      # LookupError in the MRO. Name the subclass itself instead.
      super(TaskQueue.QueueEmpty, self).__init__('Queue Empty')

  def __init__(
    self, queue_name=QUEUE_NAME, queue_server=QUEUE_TYPE,
    region=None, qurl=None, n_threads=40, project=PROJECT_NAME
  ):
    """
    queue_name: name of the cloud queue (used as the SQS qurl if qurl is None)
    queue_server: 'sqs'/'aws' (supported) or 'pull-queue'/'google' (unsupported)
    region: AWS region name; defaults to AWS_DEFAULT_REGION from secrets
    qurl: explicit SQS queue URL; overrides queue_name when provided
    n_threads: number of background worker threads for insert/delete
    project: cloud project name (not used by the SQS backend)
    """
    self._project = project
    self._region = region
    self._queue_name = queue_name
    self._queue_server = queue_server
    self._qurl = qurl
    self._api = self._initialize_interface()
    super(TaskQueue, self).__init__(n_threads) # creates self._queue

  @property
  def queue_name(self):
    return self._queue_name

  @property
  def queue_server(self):
    return self._queue_server

  # This is key to making sure threading works. Don't refactor this method away.
  def _initialize_interface(self):
    """Construct the backend API object for the configured queue server.

    Raises NotImplementedError for unsupported or unknown server types.
    """
    server = self._queue_server.lower()
    if server in ('pull-queue', 'google'):
      # Fixed: previously *returned* the exception instead of raising it,
      # which handed callers an exception object as the API.
      raise NotImplementedError("Google Cloud Tasks are not supported at this time.")
    elif server in ('sqs', 'aws'):
      qurl = self._qurl if self._qurl else self._queue_name
      region = self._region if self._region else AWS_DEFAULT_REGION
      return AWSTaskQueueAPI(qurl=qurl, region_name=region)
    else:
      raise NotImplementedError('Unknown server ' + self._queue_server)

  @property
  def enqueued(self):
    """
    Returns the approximate(!) number of tasks enqueued in the cloud.

    WARNING: The number computed by Google is eventually
      consistent. It may return impossible numbers that
      are small deviations from the number in the queue.
      For instance, we've seen 1005 enqueued after 1000
      inserts.

    Returns: (int) number of tasks in cloud queue
    """
    return self._api.enqueued

  def insert(self, task):
    """
    Insert a task into an existing queue.

    If worker threads are running, the insertion is queued to a
    background thread; otherwise it happens synchronously.
    """
    body = {
      "payload": task.payload(),
      "queueName": self._queue_name,
      "groupByTag": True,
      "tag": task.__class__.__name__
    }

    def cloud_insertion(api):
      api.insert(body)

    if len(self._threads):
      self.put(cloud_insertion)
    else:
      cloud_insertion(self._api)

    return self

  def status(self):
    """
    Gets information about the TaskQueue
    """
    return self._api.get(getStats=True)

  def get_task(self, tid):
    """
    Gets the named task in the TaskQueue.
    tid is a unique string Google provides
    e.g. '7c6e81c9b7ab23f0'
    """
    return self._api.get(tid)

  def list(self):
    """
    Lists all non-deleted Tasks in a TaskQueue,
    whether or not they are currently leased, up to a maximum of 100.
    """
    return [ totask(x) for x in self._api.list() ]

  def renew_lease(self, task, seconds):
    """Update the duration of a task lease."""
    return self._api.renew_lease(task, seconds)

  def cancel_lease(self, task):
    """Return a leased task to the queue immediately."""
    return self._api.cancel_lease(task)

  def lease(self, seconds=600, num_tasks=1, tag=None):
    """
    Acquires a lease on the topmost N unowned tasks in the specified queue.

    Required query parameters: leaseSecs, numTasks

    Raises TaskQueue.QueueEmpty when no task is available.
    """
    tag = tag if tag else None
    tasks = self._api.lease(
      numTasks=num_tasks,
      seconds=seconds,
      groupByTag=(tag is not None),
      tag=tag,
    )
    if not len(tasks):
      raise TaskQueue.QueueEmpty
    task = tasks[0]
    return totask(task)

  def patch(self):
    """
    Update tasks that are leased out of a TaskQueue.
    Required query parameters: newLeaseSeconds
    """
    # Fixed: `raise NotImplemented` raises a TypeError (NotImplemented is a
    # sentinel value, not an exception); raise the exception class instead.
    raise NotImplementedError

  def purge(self):
    """Deletes all tasks in the queue."""
    try:
      return self._api.purge()
    except AttributeError:
      # Backend has no native purge; drain by listing and deleting.
      while True:
        lst = self.list()
        if len(lst) == 0:
          break
        for task in lst:
          self.delete(task)
        self.wait()
      return self

  def acknowledge(self, task_id):
    """Acknowledge (complete) a task by id or RegisteredTask instance."""
    if isinstance(task_id, RegisteredTask):
      task_id = task_id.id

    def cloud_delete(api):
      api.acknowledge(task_id)

    if len(self._threads):
      self.put(cloud_delete)
    else:
      cloud_delete(self._api)

    return self

  def delete(self, task_id):
    """Deletes a task from a TaskQueue."""
    if isinstance(task_id, RegisteredTask):
      task_id = task_id.id

    def cloud_delete(api):
      api.delete(task_id)

    if len(self._threads):
      self.put(cloud_delete)
    else:
      cloud_delete(self._api)

    return self

  def poll(
    self, lease_seconds=LEASE_SECONDS, tag=None,
    verbose=False, execute_args=None, execute_kwargs=None,
    stop_fn=None, backoff_exceptions=None, min_backoff_window=30,
    max_backoff_window=120, log_fn=None
  ):
    """
    Poll a queue until a stop condition is reached (default forever). Note
    that this function is not thread safe as it requires a global variable
    to intercept SIGINT.

    lease_seconds: each task should be leased for this many seconds
    tag: if specified, query for only tasks that match this tag
    execute_args / execute_kwargs: pass these arguments to task execution
    backoff_exceptions: A list of exceptions that instead of causing a crash,
      instead cause the polling to back off for an increasing exponential
      random window.
    min_backoff_window: The minimum sized window (in seconds) to select a
      random backoff time.
    max_backoff_window: The window doubles each retry. This is the maximum value
      in seconds.
    stop_fn: A boolean returning function that accepts no parameters. When
      it returns True, the task execution loop will terminate. It is evaluated
      once after every task.
    log_fn: Feed error messages to this function, default print (when verbose is enabled).
    verbose: print out the status of each step

    Return: number of tasks executed
    """
    global LOOP

    # Avoid mutable default arguments; None means "empty".
    execute_args = [] if execute_args is None else execute_args
    execute_kwargs = {} if execute_kwargs is None else execute_kwargs
    backoff_exceptions = [] if backoff_exceptions is None else backoff_exceptions

    if stop_fn is None:
      stop_fn = lambda: False
    elif not callable(stop_fn):
      raise ValueError("stop_fn must be a callable. " + str(stop_fn))

    def random_exponential_window_backoff(n):
      n = min(n, min_backoff_window)
      # 120 sec max b/c on avg a request every ~250msec if 500 containers
      # in contention which seems like a quite reasonable volume of traffic
      # to handle
      high = min(2 ** n, max_backoff_window)
      return random.uniform(0, high)

    def printv(*args, **kwargs):
      if verbose:
        print(*args, **kwargs)

    LOOP = True

    def sigint_handler(signum, frame):
      global LOOP
      printv("Interrupted. Exiting after this task completes...")
      LOOP = False

    prev_sigint_handler = signal.getsignal(signal.SIGINT)
    signal.signal(signal.SIGINT, sigint_handler)

    if log_fn is None:
      log_fn = printv

    tries = 0
    executed = 0
    backoff = False
    backoff_exceptions = tuple(list(backoff_exceptions) + [ TaskQueue.QueueEmpty ])

    while LOOP:
      task = 'unknown' # for error message prior to leasing
      try:
        # Fixed: the tag parameter was accepted but never forwarded to lease.
        task = self.lease(seconds=int(lease_seconds), tag=tag)
        tries += 1
        printv(task)
        task.execute(*execute_args, **execute_kwargs)
        executed += 1
        printv("Delete enqueued task...")
        self.delete(task)
        log_fn('INFO', task, "successfully executed")
        tries = 0
      except backoff_exceptions:
        backoff = True
      except Exception as e:
        printv('ERROR', task, "raised {}\n {}".format(e, traceback.format_exc()))
        raise # this will restart the container in kubernetes
      if stop_fn():
        break
      if backoff:
        time.sleep(random_exponential_window_backoff(tries))
        backoff = False

    printv("Task execution loop exited.")
    # Restore whatever SIGINT handler was installed before polling began.
    signal.signal(signal.SIGINT, prev_sigint_handler)
    return executed

  def block_until_empty(self, interval_sec=2):
    """Sleep-poll until the cloud queue reports zero enqueued tasks."""
    while self.enqueued > 0:
      time.sleep(interval_sec)
class MockTaskQueue(object):
  """Synchronous, in-process stand-in for TaskQueue.

  Every inserted task is executed immediately; all queue-management
  methods are no-ops that return self so call chains still work.
  """

  def __init__(self, *args, **kwargs):
    # Accept and discard the real TaskQueue's constructor arguments.
    pass

  def insert(self, task):
    """Run the task right away instead of enqueuing it."""
    task.execute()
    del task

  def wait(self, progress=None):
    """No-op; nothing is ever pending."""
    return self

  def poll(self, *args, **kwargs):
    """No-op; tasks were already executed during insert()."""
    return self

  def kill_threads(self):
    """No-op; no worker threads exist."""
    return self

  def __enter__(self):
    return self

  def __exit__(self, exc_type, exc_value, exc_traceback):
    pass
class LocalTaskQueue(object):
  """TaskQueue-compatible class that buffers tasks locally and executes
  them in a process pool when the context manager exits.
  """

  def __init__(self, parallel=1, queue_name='', queue_server='', progress=True):
    """
    parallel: number of worker processes; True means one per CPU core.
    queue_name / queue_server: accepted only for TaskQueue signature
      compatibility; unused here.
    progress: whether to display the tqdm progress bar during execution.
    """
    if parallel is True:
      parallel = mp.cpu_count()
    elif not parallel:
      # Fixed: 0/False/None would previously reach ProcessPoolExecutor
      # and crash; fall back to serial execution instead.
      parallel = 1

    self.parallel = parallel
    self.queue = []
    self.progress = progress

  def insert(self, task):
    """Buffer a task for later parallel execution."""
    self.queue.append(task)

  def wait(self, progress=None):
    """No-op for API compatibility; execution happens on __exit__."""
    return self

  def poll(self, *args, **kwargs):
    """No-op for API compatibility."""
    pass

  def kill_threads(self):
    """No-op for API compatibility; no threads are used."""
    return self

  def __enter__(self):
    return self

  def __exit__(self, exception_type, exception_value, traceback):
    # Run every buffered task across the process pool. task_execute must
    # live at module scope so the executor can pickle it.
    # Fixed: the progress flag was stored but never honored; it now
    # controls the tqdm bar (default True preserves prior behavior).
    with tqdm(total=len(self.queue), desc="Tasks", disable=not self.progress) as pbar:
      with concurrent.futures.ProcessPoolExecutor(max_workers=self.parallel) as executor:
        for _ in executor.map(task_execute, self.queue):
          pbar.update()
    self.queue = []
# Defined at module scope on purpose: ProcessPoolExecutor must be able
# to pickle this callable to ship it to worker processes.
def task_execute(task):
  """Run a single task's execute() method."""
  task.execute()