Context navigation

source: main/waeup.kofa/trunk/src/waeup/kofa/utils/batching.py @ 12813

Last change on this file since 12813 was 12811, checked in by Henrik Bettermann, 10 years ago
Take also whitespaces and ignore marker into consideration.
Property svn:keywords set to `Id`
File size: 28.8 KB

Rev	Line
[7196]	1	## $Id: batching.py 12811 2015-03-23 11:06:26Z henrik $
	2	##
	3	## Copyright (C) 2011 Uli Fouquet & Henrik Bettermann
	4	## This program is free software; you can redistribute it and/or modify
	5	## it under the terms of the GNU General Public License as published by
	6	## the Free Software Foundation; either version 2 of the License, or
	7	## (at your option) any later version.
	8	##
	9	## This program is distributed in the hope that it will be useful,
	10	## but WITHOUT ANY WARRANTY; without even the implied warranty of
	11	## MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
	12	## GNU General Public License for more details.
	13	##
	14	## You should have received a copy of the GNU General Public License
	15	## along with this program; if not, write to the Free Software
	16	## Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
	17	##
[7819]	18	"""Kofa components for batch processing.
[4806]	19
	20	Batch processors eat CSV files to add, update or remove large numbers
	21	of certain kinds of objects at once.
	22	"""
	23	import grok
[8380]	24	import datetime
[4821]	25	import os
[9217]	26	import shutil
[4900]	27	import tempfile
[4821]	28	import time
[10027]	29	import unicodecsv
[9816]	30	import zc.async.interfaces
[7859]	31	from cStringIO import StringIO
[9217]	32	from persistent.list import PersistentList
	33	from zope.component import createObject, getUtility
	34	from zope.component.hooks import setSite
[9726]	35	from zope.interface import Interface, implementer
[4806]	36	from zope.schema import getFields
[11849]	37	from zope.schema.interfaces import ConstraintNotSatisfied
[8332]	38	from zope.event import notify
[9217]	39	from waeup.kofa.async import AsyncJob
[7811]	40	from waeup.kofa.interfaces import (
[9217]	41	IBatchProcessor, FatalCSVError, IObjectConverter, IJobManager,
	42	ICSVExporter, IGNORE_MARKER, DuplicationError, JOB_STATUS_MAP,
[9726]	43	IExportJobContainer, IExportJob, IExportContainerFinder)
[4806]	44
	45	class BatchProcessor(grok.GlobalUtility):
	46	"""A processor to add, update, or remove data.
	47
	48	This is a non-active baseclass.
	49	"""
[8220]	50	grok.implements(IBatchProcessor)
[4806]	51	grok.context(Interface)
	52	grok.baseclass()
	53
	54	# Name used in pages and forms...
[7933]	55	name = u'Non-registered base processor'
[6259]	56
[4806]	57	# Internal name...
[7933]	58	util_name = 'baseprocessor'
[6259]	59
[4806]	60	# Items for this processor need an interface with zope.schema fields.
[5009]	61	iface = Interface
[6259]	62
[4806]	63	# The name must be the same as the util_name attribute in order to
	64	# register this utility correctly.
	65	grok.name(util_name)
	66
	67	# Headers needed to locate items...
	68	location_fields = ['code', 'faculty_code']
[6259]	69
[4806]	70	# A factory with this name must be registered...
	71	factory_name = 'waeup.Department'
	72
	73	@property
	74	def required_fields(self):
[4829]	75	"""Required fields that have no default.
	76
	77	A list of names of field, whose value cannot be set if not
	78	given during creation. Therefore these fields must exist in
	79	input.
	80
	81	Fields with a default != missing_value do not belong to this
	82	category.
	83	"""
[4806]	84	result = []
	85	for key, field in getFields(self.iface).items():
	86	if key in self.location_fields:
	87	continue
[4829]	88	if field.default is not field.missing_value:
	89	continue
[4806]	90	if field.required:
	91	result.append(key)
	92	return result
[6259]	93
[4806]	94	@property
	95	def req(self):
	96	result = dict(
	97	create = self.location_fields + self.required_fields,
	98	update = self.location_fields,
	99	remove = self.location_fields,
	100	)
	101	return result
	102
	103	@property
	104	def available_fields(self):
	105	return sorted(list(set(
	106	self.location_fields + getFields(self.iface).keys())))
[6259]	107
[4806]	108	def getHeaders(self, mode='create'):
	109	return self.available_fields
	110
	111	def checkHeaders(self, headerfields, mode='create'):
	112	req = self.req[mode]
	113	# Check for required fields...
	114	for field in req:
	115	if not field in headerfields:
	116	raise FatalCSVError(
	117	"Need at least columns %s for import!" %
	118	', '.join(["'%s'" % x for x in req]))
[6828]	119	# Check for double fields. Cannot happen because this error is
	120	# already catched in views
[4806]	121	not_ignored_fields = [x for x in headerfields
	122	if not x.startswith('--')]
	123	if len(set(not_ignored_fields)) < len(not_ignored_fields):
	124	raise FatalCSVError(
	125	"Double headers: each column name may only appear once.")
	126	return True
	127
	128	def applyMapping(self, row, mapping):
[4811]	129	"""Apply mapping to a row of CSV data.
[6824]	130
[4811]	131	"""
[4806]	132	result = dict()
	133	for key, replacement in mapping.items():
[6824]	134	if replacement == u'--IGNORE--':
	135	# Skip ignored columns in failed and finished data files.
	136	continue
[4806]	137	result[replacement] = row[key]
	138	return result
[6259]	139
[4832]	140	def getMapping(self, path, headerfields, mode):
[6824]	141	"""Get a mapping from CSV file headerfields to actually used fieldnames.
	142
[4811]	143	"""
[4832]	144	result = dict()
[10027]	145	reader = unicodecsv.reader(open(path, 'rb'))
[4806]	146	raw_header = reader.next()
[4832]	147	for num, field in enumerate(headerfields):
	148	if field not in self.location_fields and mode == 'remove':
[6824]	149	# Skip non-location fields when removing.
	150	continue
	151	if field == u'--IGNORE--':
	152	# Skip ignored columns in failed and finished data files.
	153	continue
[4832]	154	result[raw_header[num]] = field
	155	return result
[4806]	156
[6273]	157	def stringFromErrs(self, errors, inv_errors):
	158	result = []
	159	for err in errors:
	160	fieldname, message = err
	161	result.append("%s: %s" % (fieldname, message))
	162	for err in inv_errors:
	163	result.append("invariant: %s" % err)
	164	return '; '.join(result)
	165
[4806]	166	def callFactory(self, args, *kw):
	167	return createObject(self.factory_name)
	168
	169	def parentsExist(self, row, site):
[4811]	170	"""Tell whether the parent object for data in ``row`` exists.
	171	"""
[4806]	172	raise NotImplementedError('method not implemented')
	173
	174	def entryExists(self, row, site):
[4811]	175	"""Tell whether there already exists an entry for ``row`` data.
	176	"""
[4806]	177	raise NotImplementedError('method not implemented')
	178
	179	def getParent(self, row, site):
[4811]	180	"""Get the parent object for the entry in ``row``.
	181	"""
[4806]	182	raise NotImplementedError('method not implemented')
[6259]	183
[5009]	184	def getEntry(self, row, site):
[12513]	185	"""Get the object for the entry in ``row``.
[5009]	186	"""
	187	raise NotImplementedError('method not implemented')
[6259]	188
[4806]	189	def addEntry(self, obj, row, site):
[4811]	190	"""Add the entry given given by ``row`` data.
	191	"""
[4806]	192	raise NotImplementedError('method not implemented')
	193
	194	def delEntry(self, row, site):
[4811]	195	"""Delete entry given by ``row`` data.
	196	"""
[6259]	197	raise NotImplementedError('method not implemented')
[4806]	198
[7950]	199	def checkUpdateRequirements(self, obj, row, site):
	200	"""Checks requirements the object must fulfill when being updated.
[7938]	201
	202	This method is not used in case of deleting or adding objects.
	203
[7950]	204	Returns error messages as strings in case of requirement
[7938]	205	problems.
[7937]	206	"""
[7938]	207	return None
[7937]	208
[9706]	209	def updateEntry(self, obj, row, site, filename):
[4984]	210	"""Update obj to the values given in row.
[8220]	211
	212	Returns a string describing the fields changed.
[4984]	213	"""
[8220]	214	changed = []
[4829]	215	for key, value in row.items():
[8220]	216	# Skip fields to be ignored.
	217	if value == IGNORE_MARKER:
	218	continue
[8304]	219	# Skip fields not declared in interface and which are
	220	# not yet attributes of existing objects. We can thus not
	221	# add non-existing attributes here.
[8220]	222	if not hasattr(obj, key):
	223	continue
[9265]	224	try:
	225	setattr(obj, key, value)
	226	except AttributeError:
	227	# Computed attributes can't be set.
	228	continue
[8222]	229	log_value = getattr(value, 'code', value)
	230	changed.append('%s=%s' % (key, log_value))
[8332]	231
[8333]	232	# If any catalog is involved it must be updated.
	233	#
	234	# XXX: The event is also triggered when creating objects as
	235	# updateEntry is called also when creating entries resulting
	236	# in objectAdded and additional objectModified events.
	237	if len(changed):
	238	notify(grok.ObjectModifiedEvent(obj))
[8332]	239
[8220]	240	return ', '.join(changed)
[4821]	241
[4832]	242	def createLogfile(self, path, fail_path, num, warnings, mode, user,
[4885]	243	timedelta, logger=None):
	244	"""Write to log file.
[4821]	245	"""
[4885]	246	if logger is None:
	247	return
[9739]	248	logger.info(
	249	"processed: %s, %s mode, %s lines (%s successful/ %s failed), "
	250	"%0.3f s (%0.4f s/item)" % (
	251	path, mode, num, num - warnings, warnings,
	252	timedelta, timedelta/(num or 1)))
[4821]	253	return
[4877]	254
	255	def writeFailedRow(self, writer, row, warnings):
	256	"""Write a row with error messages to error CSV.
	257
	258	If warnings is a list of strings, they will be concatenated.
	259	"""
	260	error_col = warnings
	261	if isinstance(warnings, list):
	262	error_col = ' / '.join(warnings)
	263	row['--ERRORS--'] = error_col
	264	writer.writerow(row)
	265	return
[6259]	266
[8220]	267	def checkConversion(self, row, mode='ignore', ignore_empty=True):
[6847]	268	"""Validates all values in row.
	269	"""
	270	converter = IObjectConverter(self.iface)
	271	errs, inv_errs, conv_dict = converter.fromStringDict(
[8220]	272	row, self.factory_name, mode=mode)
[6847]	273	return errs, inv_errs, conv_dict
	274
[12810]	275
	276	def emptyRow(self, row):
	277	"""Detect empty rows.
	278	"""
	279	for value in row.values():
[12811]	280	if value.strip() and not value in (None, IGNORE_MARKER):
[12810]	281	return False
	282	return True
	283
[4885]	284	def doImport(self, path, headerfields, mode='create', user='Unknown',
[8220]	285	logger=None, ignore_empty=True):
[4811]	286	"""Perform actual import.
	287	"""
[4832]	288	time_start = time.time()
[4806]	289	self.checkHeaders(headerfields, mode)
[4832]	290	mapping = self.getMapping(path, headerfields, mode)
[10027]	291	reader = unicodecsv.DictReader(open(path, 'rb'))
[4889]	292
[4900]	293	temp_dir = tempfile.mkdtemp()
[6259]	294
[6273]	295	base = os.path.basename(path)
	296	(base, ext) = os.path.splitext(base)
[4900]	297	failed_path = os.path.join(temp_dir, "%s.pending%s" % (base, ext))
[6831]	298	failed_headers = mapping.values()
[4877]	299	failed_headers.append('--ERRORS--')
[10027]	300	failed_writer = unicodecsv.DictWriter(open(failed_path, 'wb'),
	301	failed_headers)
[8573]	302	os.chmod(failed_path, 0664)
[6831]	303	failed_writer.writerow(dict([(x,x) for x in failed_headers]))
[4891]	304
[4900]	305	finished_path = os.path.join(temp_dir, "%s.finished%s" % (base, ext))
[6831]	306	finished_headers = mapping.values()
[10027]	307	finished_writer = unicodecsv.DictWriter(open(finished_path, 'wb'),
	308	finished_headers)
[8905]	309	os.chmod(finished_path, 0664)
[4891]	310	finished_writer.writerow(dict([(x,x) for x in finished_headers]))
[6259]	311
[4806]	312	num =0
[4878]	313	num_warns = 0
[4806]	314	site = grok.getSite()
[7859]	315
[4806]	316	for raw_row in reader:
	317	num += 1
[12810]	318	# Skip row if empty
	319	if self.emptyRow(raw_row):
	320	continue
[4806]	321	string_row = self.applyMapping(raw_row, mapping)
[8222]	322	if ignore_empty and mode in ('update',):
[12810]	323	# Replace empty strings with ignore-markers
[8222]	324	for key, val in string_row.items():
[8220]	325	if val == '':
[8222]	326	string_row[key] = IGNORE_MARKER
	327	row = dict(string_row.items()) # create deep copy
[6847]	328	errs, inv_errs, conv_dict = self.checkConversion(string_row, mode)
[6273]	329	if errs or inv_errs:
[4878]	330	num_warns += 1
[6273]	331	conv_warnings = self.stringFromErrs(errs, inv_errs)
	332	self.writeFailedRow(
[6824]	333	failed_writer, string_row, conv_warnings)
[4821]	334	continue
[6273]	335	row.update(conv_dict)
[6259]	336
[4806]	337	if mode == 'create':
	338	if not self.parentsExist(row, site):
[4878]	339	num_warns += 1
[4877]	340	self.writeFailedRow(
[6824]	341	failed_writer, string_row,
[4877]	342	"Not all parents do exist yet. Skipping")
[4806]	343	continue
	344	if self.entryExists(row, site):
[4878]	345	num_warns += 1
[4877]	346	self.writeFailedRow(
[6824]	347	failed_writer, string_row,
[8330]	348	"This object already exists. Skipping.")
[4806]	349	continue
	350	obj = self.callFactory()
[7273]	351	# Override all values in row, also
	352	# student_ids and applicant_ids which have been
	353	# generated in the respective __init__ methods before.
[9706]	354	self.updateEntry(obj, row, site, base)
[6243]	355	try:
	356	self.addEntry(obj, row, site)
[6273]	357	except KeyError, error:
[6219]	358	num_warns += 1
	359	self.writeFailedRow(
[6824]	360	failed_writer, string_row,
[6273]	361	"%s Skipping." % error.message)
[8540]	362	continue
[8509]	363	except DuplicationError, error:
	364	num_warns += 1
	365	self.writeFailedRow(
	366	failed_writer, string_row,
	367	"%s Skipping." % error.msg)
[6219]	368	continue
[4806]	369	elif mode == 'remove':
	370	if not self.entryExists(row, site):
[4878]	371	num_warns += 1
[4877]	372	self.writeFailedRow(
[6824]	373	failed_writer, string_row,
[9219]	374	"Cannot remove: no such entry")
[4806]	375	continue
	376	self.delEntry(row, site)
	377	elif mode == 'update':
	378	obj = self.getEntry(row, site)
	379	if obj is None:
[4878]	380	num_warns += 1
[4877]	381	self.writeFailedRow(
[6824]	382	failed_writer, string_row,
[9219]	383	"Cannot update: no such entry")
[4806]	384	continue
[7950]	385	update_errors = self.checkUpdateRequirements(obj, row, site)
[7938]	386	if update_errors is not None:
[7937]	387	num_warns += 1
	388	self.writeFailedRow(
	389	failed_writer, string_row, update_errors)
	390	continue
[11849]	391	try:
	392	self.updateEntry(obj, row, site, base)
	393	except ConstraintNotSatisfied, err:
	394	num_warns += 1
	395	self.writeFailedRow(
	396	failed_writer, string_row,
	397	"ConstraintNotSatisfied: %s" % err)
	398	continue
[4891]	399	finished_writer.writerow(string_row)
[4821]	400
[4832]	401	time_end = time.time()
	402	timedelta = time_end - time_start
[6259]	403
[4878]	404	self.createLogfile(path, failed_path, num, num_warns, mode, user,
[4885]	405	timedelta, logger=logger)
[4894]	406	failed_path = os.path.abspath(failed_path)
[4878]	407	if num_warns == 0:
[4821]	408	del failed_writer
	409	os.unlink(failed_path)
[4894]	410	failed_path = None
	411	return (num, num_warns,
	412	os.path.abspath(finished_path), failed_path)
[7859]	413
[9032]	414	def get_csv_skeleton(self):
	415	"""Export CSV file only with a header of available fields.
	416
	417	A raw string with CSV data should be returned.
	418	"""
	419	outfile = StringIO()
[10027]	420	writer = unicodecsv.DictWriter(outfile, self.available_fields)
[9734]	421	writer.writerow(
	422	dict(zip(self.available_fields, self.available_fields))) # header
[9032]	423	outfile.seek(0)
	424	return outfile.read()
	425
[7859]	426	class ExporterBase(object):
	427	"""A base for exporters.
	428	"""
	429	grok.implements(ICSVExporter)
	430
	431	#: Fieldnames considered by this exporter
	432	fields = ('code', 'title', 'title_prefix')
	433
[7907]	434	#: The title under which this exporter will be displayed
	435	#: (if registered as a utility)
	436	title = 'Override this title'
	437
[7859]	438	def mangle_value(self, value, name, context=None):
	439	"""Hook for mangling values in derived classes
	440	"""
	441	if isinstance(value, bool):
	442	value = value and '1' or '0'
	443	elif isinstance(value, unicode):
	444	# CSV writers like byte streams better than unicode
	445	value = value.encode('utf-8')
[8380]	446	elif isinstance(value, datetime.datetime):
[11737]	447	#value = str(value)
	448	value = str('%s#' % value) # changed 2014-07-06, see ticket #941
[8380]	449	elif isinstance(value, datetime.date):
	450	# Order is important here: check for date after datetime as
	451	# datetimes are also dates.
	452	#
	453	# Append hash '#' to dates to circumvent unwanted excel automatic
	454	value = str('%s#' % value)
[7859]	455	elif value is None:
	456	# None is not really representable in CSV files
	457	value = ''
	458	return value
	459
	460	def get_csv_writer(self, filepath=None):
	461	"""Get a CSV dict writer instance open for writing.
	462
	463	Returns a tuple (<writer>, <outfile>) where ``<writer>`` is a
	464	:class:`csv.DictWriter` instance and outfile is the real file
	465	which is written to. The latter is important when writing to
	466	StringIO and can normally be ignored otherwise.
	467
	468	The returned file will already be filled with the header row.
	469
	470	Please note that if you give a filepath, the returned outfile
	471	is open for writing only and you might have to close it before
	472	reopening it for reading.
	473	"""
	474	if filepath is None:
	475	outfile = StringIO()
	476	else:
	477	outfile = open(filepath, 'wb')
[10027]	478	writer = unicodecsv.DictWriter(outfile, self.fields)
[7859]	479	writer.writerow(dict(zip(self.fields, self.fields))) # header
	480	return writer, outfile
	481
	482	def write_item(self, obj, writer):
	483	"""Write a row extracted from `obj` into CSV file using `writer`.
	484	"""
	485	row = {}
	486	for name in self.fields:
	487	value = getattr(obj, name, None)
	488	value = self.mangle_value(value, name, obj)
	489	row[name] = value
	490	writer.writerow(row)
	491	return
	492
	493	def close_outfile(self, filepath, outfile):
	494	"""Close outfile.
	495
	496	If filepath is None, the contents of outfile is returned.
	497	"""
	498	outfile.seek(0)
	499	if filepath is None:
	500	return outfile.read()
	501	outfile.close()
	502	return
	503
[9797]	504	def get_filtered(self, site, **kw):
	505	"""Get datasets to export filtered by keyword arguments.
	506
	507	Returns an iterable.
	508	"""
	509	raise NotImplementedError
	510
[12516]	511	def get_selected(self, site, selected):
	512	"""Get datasets to export for selected items
	513	specified by a list of identifiers.
	514
	515	Returns an iterable.
	516	"""
	517	raise NotImplementedError
	518
[7859]	519	def export(self, iterable, filepath=None):
	520	"""Export `iterable` as CSV file.
	521
	522	If `filepath` is ``None``, a raw string with CSV data should
	523	be returned.
	524	"""
	525	raise NotImplementedError
	526
	527	def export_all(self, site, filepath=None):
	528	"""Export all appropriate objects in `site` into `filepath` as
	529	CSV data.
	530
	531	If `filepath` is ``None``, a raw string with CSV data should
	532	be returned.
	533	"""
	534	raise NotImplementedError
[9217]	535
[9797]	536	def export_filtered(self, site, filepath=None, **kw):
	537	"""Export items denoted by `args` and `kw`.
[9217]	538
[9797]	539	If `filepath` is ``None``, a raw string with CSV data should
	540	be returned.
	541	"""
	542	data = self.get_filtered(site, **kw)
	543	return self.export(data, filepath=filepath)
	544
[12516]	545	def export_selected(self, site, filepath=None, **kw):
	546	"""Export those items specified by a list of identifiers
	547	called `selected`.
	548
	549	If `filepath` is ``None``, a raw string with CSV data should
	550	be returned.
	551	"""
	552	selected = kw.get('selected', [])
	553	data = self.get_selected(site, selected)
	554	return self.export(data, filepath=filepath)
	555
[9797]	556	def export_job(site, exporter_name, **kw):
[9217]	557	"""Export all entries delivered by exporter and store it in a temp file.
	558
	559	`site` gives the site to search. It will be passed to the exporter
	560	and also be set as 'current site' as the function is used in
	561	asynchronous jobs which run in their own threads and have no site
	562	set initially. Therefore `site` must also be a valid value for use
	563	with `zope.component.hooks.setSite()`.
	564
	565	`exporter_name` is the utility name under which the desired
	566	exporter was registered with the ZCA.
	567
	568	The resulting CSV file will be stored in a new temporary directory
	569	(using :func:`tempfile.mkdtemp`). It will be named after the
	570	exporter used with `.csv` filename extension.
	571
	572	Returns the path to the created CSV file.
	573
	574	.. note:: It is the callers responsibility to clean up the used
	575	file and its parent directory.
	576	"""
	577	setSite(site)
	578	exporter = getUtility(ICSVExporter, name=exporter_name)
	579	output_dir = tempfile.mkdtemp()
	580	filename = '%s.csv' % exporter_name
	581	output_path = os.path.join(output_dir, filename)
[9797]	582	if kw == {}:
	583	exporter.export_all(site, filepath=output_path)
[12516]	584	elif kw.has_key('selected'):
	585	exporter.export_selected(site, filepath=output_path, **kw)
[9797]	586	else:
	587	exporter.export_filtered(site, filepath=output_path, **kw)
[9217]	588	return output_path
	589
	590	class AsyncExportJob(AsyncJob):
	591	"""An IJob that exports data to CSV files.
	592
	593	`AsyncExportJob` instances are regular `AsyncJob` instances with a
	594	different constructor API. Instead of a callable to execute, you
	595	must pass a `site` and some `exporter_name` to trigger an export.
	596
	597	The real work is done when an instance of this class is put into a
	598	queue. See :mod:`waeup.kofa.async` to learn more about
	599	asynchronous jobs.
	600
	601	The `exporter_name` must be the name under which an ICSVExporter
	602	utility was registered with the ZCA.
	603
	604	The `site` must be a valid site or ``None``.
	605
	606	The result of an `AsyncExportJob` is the path to generated CSV
	607	file. The file will reside in a temporary directory that should be
	608	removed after being used.
	609	"""
	610	grok.implements(IExportJob)
	611
[9718]	612	def __init__(self, site, exporter_name, args, *kwargs):
[9217]	613	super(AsyncExportJob, self).__init__(
[9718]	614	export_job, site, exporter_name, args, *kwargs)
[9217]	615
[9816]	616	@property
	617	def finished(self):
	618	"""A job is marked `finished` if it is completed.
	619
	620	Please note: a finished report job does not neccessarily
	621	provide an IReport result. See meth:`failed`.
	622	"""
	623	return self.status == zc.async.interfaces.COMPLETED
	624
	625	@property
	626	def failed(self):
	627	"""A report job is marked failed iff it is finished and the
	628	result is None.
	629
	630	While a job is unfinished, the `failed` status is ``None``.
	631
	632	Failed jobs normally provide a `traceback` to examine reasons.
	633	"""
	634	if not self.finished:
	635	return None
	636	if getattr(self, 'result', None) is None:
	637	return True
	638	return False
	639
[9217]	640	class ExportJobContainer(object):
	641	"""A mix-in that provides functionality for asynchronous export jobs.
	642	"""
	643	grok.implements(IExportJobContainer)
	644	running_exports = PersistentList()
	645
[9718]	646	def start_export_job(self, exporter_name, user_id, args, *kwargs):
[9217]	647	"""Start asynchronous export job.
	648
	649	`exporter_name` is the name of an exporter utility to be used.
	650
	651	`user_id` is the ID of the user that triggers the export.
	652
	653	The job_id is stored along with exporter name and user id in a
	654	persistent list.
	655
[9718]	656	The method supports additional positional and keyword
	657	arguments, which are passed as-is to the respective
	658	:class:`AsyncExportJob`.
	659
[9217]	660	Returns the job ID of the job started.
	661	"""
	662	site = grok.getSite()
	663	manager = getUtility(IJobManager)
[9718]	664	job = AsyncExportJob(site, exporter_name, args, *kwargs)
[9217]	665	job_id = manager.put(job)
	666	# Make sure that the persisted list is stored in ZODB
	667	self.running_exports = PersistentList(self.running_exports)
	668	self.running_exports.append((job_id, exporter_name, user_id))
	669	return job_id
	670
	671	def get_running_export_jobs(self, user_id=None):
	672	"""Get export jobs for user with `user_id` as list of tuples.
	673
	674	Each tuples holds ``<job_id>, <exporter_name>, <user_id>`` in
	675	that order. The ``<exporter_name>`` is the utility name of the
	676	used exporter.
	677
	678	If `user_id` is ``None``, all running jobs are returned.
	679	"""
	680	entries = []
	681	to_delete = []
	682	manager = getUtility(IJobManager)
	683	for entry in self.running_exports:
	684	if user_id is not None and entry[2] != user_id:
	685	continue
	686	if manager.get(entry[0]) is None:
	687	to_delete.append(entry)
	688	continue
	689	entries.append(entry)
	690	if to_delete:
	691	self.running_exports = PersistentList(
	692	[x for x in self.running_exports if x not in to_delete])
	693	return entries
	694
	695	def get_export_jobs_status(self, user_id=None):
	696	"""Get running/completed export jobs for `user_id` as list of tuples.
	697
	698	Each tuple holds ``<raw status>, <status translated>,
	699	<exporter title>`` in that order, where ``<status
	700	translated>`` and ``<exporter title>`` are translated strings
	701	representing the status of the job and the human readable
	702	title of the exporter used.
	703	"""
	704	entries = self.get_running_export_jobs(user_id)
	705	result = []
	706	manager = getUtility(IJobManager)
	707	for entry in entries:
	708	job = manager.get(entry[0])
	709	if job is None:
	710	continue
	711	status, status_translated = JOB_STATUS_MAP[job.status]
	712	exporter_name = getUtility(ICSVExporter, name=entry[1]).title
	713	result.append((status, status_translated, exporter_name))
	714	return result
	715
	716	def delete_export_entry(self, entry):
	717	"""Delete the export denoted by `entry`.
	718
	719	Removes given entry from the local `running_exports` list and also
	720	removes the regarding job via the local job manager.
	721
	722	`entry` must be a tuple ``(<job id>, <exporter name>, <user
	723	id>)`` as created by :meth:`start_export_job` or returned by
	724	:meth:`get_running_export_jobs`.
	725	"""
	726	manager = getUtility(IJobManager)
	727	job = manager.get(entry[0])
	728	if job is not None:
	729	# remove created export file
	730	if isinstance(job.result, basestring):
	731	if os.path.exists(os.path.dirname(job.result)):
	732	shutil.rmtree(os.path.dirname(job.result))
	733	manager.remove(entry[0], self)
	734	new_entries = [x for x in self.running_exports
	735	if x != entry]
	736	self.running_exports = PersistentList(new_entries)
	737	return
	738
	739	def entry_from_job_id(self, job_id):
	740	"""Get entry tuple for `job_id`.
	741
	742	Returns ``None`` if no such entry can be found.
	743	"""
	744	for entry in self.running_exports:
	745	if entry[0] == job_id:
	746	return entry
	747	return None
[9726]	748
	749	class VirtualExportJobContainer(ExportJobContainer):
	750	"""A virtual export job container.
	751
	752	Virtual ExportJobContainers can be used as a mixin just like real
	753	ExportJobContainer.
	754
	755	They retrieve and store data in the site-wide ExportJobContainer.
	756
	757	Functionality is currently entirely as for regular
	758	ExportJobContainers, except that data is stored elsewhere.
	759
	760	VirtualExportJobContainers need a registered
	761	IExportContainerFinder utility to find a suitable container for
	762	storing data.
	763	"""
	764	grok.implements(IExportJobContainer)
	765
	766	@property
	767	def _site_container(self):
	768	return getUtility(IExportContainerFinder)()
	769
	770	# The following is a simple trick. While ExportJobContainers store
	771	# only one attribute in ZODB, it is sufficient to replace this
	772	# attribute `running_exports` with a suitable manager to make the
	773	# whole virtual container work like the original but with the data
	774	# stored in the site-wide exports container. This way, virtual
	775	# export containers provide the whole functionality of a regular
	776	# exports container but store no data at all with themselves.
	777	@property
	778	def running_exports(self):
	779	"""Exports stored in the site-wide exports container.
	780	"""
	781	return self._site_container.running_exports
	782
	783	@running_exports.setter
	784	def running_exports(self, value):
	785	self._site_container.running_exports = value
	786
	787	@running_exports.deleter
	788	def running_exports(self):
	789	del self._site_container.running_exports
	790
[9823]	791	@property
	792	def logger(self):
	793	return self._site_container.logger
[9726]	794
	795	@implementer(IExportContainerFinder)
	796	class ExportContainerFinder(grok.GlobalUtility):
	797	"""Finder for local (site-wide) export container.
	798	"""
	799
	800	def __call__(self):
	801	"""Get the local export container-
	802
	803	If no site can be determined or the site provides no export
	804	container, None is returned.
	805	"""
	806	site = grok.getSite()
	807	if site is None:
	808	return None
	809	return site.get('datacenter', None)

Note: See TracBrowser for help on using the repository browser.

Download in other formats: