Context navigation

source: main/waeup.ikoba/trunk/src/waeup/ikoba/customers/batching.py @ 12220

Last change on this file since 12220 was 12212, checked in by Henrik Bettermann, 11 years ago
Remove unused lists and tuples.
Property svn:keywords set to `Id`
File size: 21.6 KB

Line
1	## $Id: batching.py 12212 2014-12-13 09:36:29Z henrik $
2	##
3	## Copyright (C) 2014 Uli Fouquet & Henrik Bettermann
4	## This program is free software; you can redistribute it and/or modify
5	## it under the terms of the GNU General Public License as published by
6	## the Free Software Foundation; either version 2 of the License, or
7	## (at your option) any later version.
8	##
9	## This program is distributed in the hope that it will be useful,
10	## but WITHOUT ANY WARRANTY; without even the implied warranty of
11	## MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
12	## GNU General Public License for more details.
13	##
14	## You should have received a copy of the GNU General Public License
15	## along with this program; if not, write to the Free Software
16	## Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
17	##
18	"""Batch processing components for customer objects.
19
20	Batch processors eat CSV files to add, update or remove large numbers
21	of certain kinds of objects at once.
22
23	Here we define the processors for customers specific objects like
24	customers and subobjects.
25	"""
26	import grok
27	import unicodecsv as csv # XXX: csv ops should move to dedicated module.
28	from time import time
29	from datetime import datetime
30	from zope.i18n import translate
31	from zope.interface import Interface
32	from zope.schema import getFields
33	from zope.component import queryUtility, getUtility, createObject
34	from zope.event import notify
35	from zope.catalog.interfaces import ICatalog
36	from hurry.workflow.interfaces import IWorkflowState, IWorkflowInfo
37	from waeup.ikoba.interfaces import (
38	IBatchProcessor, FatalCSVError, IObjectConverter, IUserAccount,
39	IObjectHistory, IGNORE_MARKER)
40	from waeup.ikoba.interfaces import IIkobaUtils
41	from waeup.ikoba.interfaces import MessageFactory as _
42	from waeup.ikoba.documents.utils import generate_document_id
43	from waeup.ikoba.customers.utils import generate_contract_id
44	from waeup.ikoba.customers.interfaces import (
45	ICustomer, ICustomerUpdateByRegNo,
46	ICustomerDocument, IContract, ISampleContract)
47	from waeup.ikoba.customers.workflow import (
48	IMPORTABLE_REGISTRATION_STATES, IMPORTABLE_REGISTRATION_TRANSITIONS)
49	from waeup.ikoba.utils.batching import BatchProcessor
50
51
52	class CustomerProcessor(BatchProcessor):
53	"""A batch processor for ICustomer objects.
54	"""
55	grok.implements(IBatchProcessor)
56	grok.provides(IBatchProcessor)
57	grok.context(Interface)
58	util_name = 'customerprocessor'
59	grok.name(util_name)
60
61	name = _('Customer Processor')
62	iface = ICustomer
63	iface_byregnumber = ICustomerUpdateByRegNo
64
65	location_fields = []
66	factory_name = 'waeup.Customer'
67
68	@property
69	def available_fields(self):
70	fields = getFields(self.iface)
71	return sorted(list(set(
72	['customer_id', 'reg_number',
73	'password', 'state', 'transition'] + fields.keys())))
74
75	def checkHeaders(self, headerfields, mode='create'):
76	if 'state' in headerfields and 'transition' in headerfields:
77	raise FatalCSVError(
78	"State and transition can't be imported at the same time!")
79	if not 'reg_number' in headerfields and not 'customer_id' \
80	in headerfields:
81	raise FatalCSVError(
82	"Need at least columns customer_id or reg_number " +
83	"for import!")
84	if mode == 'create':
85	for field in self.required_fields:
86	if not field in headerfields:
87	raise FatalCSVError(
88	"Need at least columns %s for import!" %
89	', '.join(["'%s'" % x for x in self.required_fields]))
90	# Check for fields to be ignored...
91	not_ignored_fields = [x for x in headerfields
92	if not x.startswith('--')]
93	if len(set(not_ignored_fields)) < len(not_ignored_fields):
94	raise FatalCSVError(
95	"Double headers: each column name may only appear once.")
96	return True
97
98	def parentsExist(self, row, site):
99	return 'customers' in site.keys()
100
101	def getLocator(self, row):
102	if row.get('customer_id', None) not in (None, IGNORE_MARKER):
103	return 'customer_id'
104	elif row.get('reg_number', None) not in (None, IGNORE_MARKER):
105	return 'reg_number'
106	else:
107	return None
108
109	# The entry never exists in create mode.
110	def entryExists(self, row, site):
111	return self.getEntry(row, site) is not None
112
113	def getParent(self, row, site):
114	return site['customers']
115
116	def getEntry(self, row, site):
117	if not 'customers' in site.keys():
118	return None
119	if self.getLocator(row) == 'customer_id':
120	if row['customer_id'] in site['customers']:
121	customer = site['customers'][row['customer_id']]
122	return customer
123	elif self.getLocator(row) == 'reg_number':
124	reg_number = row['reg_number']
125	cat = queryUtility(ICatalog, name='customers_catalog')
126	results = list(
127	cat.searchResults(reg_number=(reg_number, reg_number)))
128	if results:
129	return results[0]
130	return None
131
132	def addEntry(self, obj, row, site):
133	parent = self.getParent(row, site)
134	parent.addCustomer(obj)
135	# Reset _curr_cust_id if customer_id has been imported
136	if self.getLocator(row) == 'customer_id':
137	parent._curr_cust_id -= 1
138	# We have to log this if state is provided. If not,
139	# logging is done by the event handler handle_customer_added
140	if 'state' in row:
141	parent.logger.info('%s - Customer record created' % obj.customer_id)
142	history = IObjectHistory(obj)
143	history.addMessage(_('Customer record created'))
144	return
145
146	def delEntry(self, row, site):
147	customer = self.getEntry(row, site)
148	if customer is not None:
149	parent = self.getParent(row, site)
150	parent.logger.info('%s - Customer removed' % customer.customer_id)
151	del parent[customer.customer_id]
152	pass
153
154	def checkUpdateRequirements(self, obj, row, site):
155	"""Checks requirements the object must fulfill when being updated.
156
157	This method is not used in case of deleting or adding objects.
158
159	Returns error messages as strings in case of requirement
160	problems.
161	"""
162	transition = row.get('transition', IGNORE_MARKER)
163	if transition not in (IGNORE_MARKER, ''):
164	allowed_transitions = IWorkflowInfo(obj).getManualTransitionIds()
165	if transition not in allowed_transitions:
166	return 'Transition not allowed.'
167	return None
168
169	def updateEntry(self, obj, row, site, filename):
170	"""Update obj to the values given in row.
171	"""
172	items_changed = ''
173
174	# Remove customer_id from row if empty
175	if 'customer_id' in row and row['customer_id'] in (None, IGNORE_MARKER):
176	row.pop('customer_id')
177
178	# Update password
179	# XXX: Take DELETION_MARKER into consideration
180	if 'password' in row:
181	passwd = row.get('password', IGNORE_MARKER)
182	if passwd not in ('', IGNORE_MARKER):
183	if passwd.startswith('{SSHA}'):
184	# already encrypted password
185	obj.password = passwd
186	else:
187	# not yet encrypted password
188	IUserAccount(obj).setPassword(passwd)
189	items_changed += ('%s=%s, ' % ('password', passwd))
190	row.pop('password')
191
192	# Update registration state
193	if 'state' in row:
194	state = row.get('state', IGNORE_MARKER)
195	if state not in (IGNORE_MARKER, ''):
196	value = row['state']
197	IWorkflowState(obj).setState(value)
198	msg = _("State '${a}' set", mapping={'a': value})
199	history = IObjectHistory(obj)
200	history.addMessage(msg)
201	items_changed += ('%s=%s, ' % ('state', state))
202	row.pop('state')
203
204	if 'transition' in row:
205	transition = row.get('transition', IGNORE_MARKER)
206	if transition not in (IGNORE_MARKER, ''):
207	value = row['transition']
208	IWorkflowInfo(obj).fireTransition(value)
209	items_changed += ('%s=%s, ' % ('transition', transition))
210	row.pop('transition')
211
212	# apply other values...
213	items_changed += super(CustomerProcessor, self).updateEntry(
214	obj, row, site, filename)
215
216	# Log actions...
217	parent = self.getParent(row, site)
218	if hasattr(obj, 'customer_id'):
219	# Update mode: the customer exists and we can get the customer_id.
220	# Create mode: the record contains the customer_id
221	parent.logger.info(
222	'%s - %s - %s - updated: %s'
223	% (self.name, filename, obj.customer_id, items_changed))
224	else:
225	# Create mode: the customer does not yet exist
226	# XXX: It seems that this never happens because customer_id
227	# is always set.
228	parent.logger.info(
229	'%s - %s - %s - imported: %s'
230	% (self.name, filename, obj.customer_id, items_changed))
231	return items_changed
232
233	def getMapping(self, path, headerfields, mode):
234	"""Get a mapping from CSV file headerfields to actually used fieldnames.
235	"""
236	result = dict()
237	reader = csv.reader(open(path, 'rb'))
238	raw_header = reader.next()
239	for num, field in enumerate(headerfields):
240	if field not in ['customer_id', 'reg_number'] and mode == 'remove':
241	continue
242	if field == u'--IGNORE--':
243	# Skip ignored columns in failed and finished data files.
244	continue
245	result[raw_header[num]] = field
246	return result
247
248	def checkConversion(self, row, mode='create'):
249	"""Validates all values in row.
250	"""
251	iface = self.iface
252	if mode in ['update', 'remove']:
253	if self.getLocator(row) == 'reg_number':
254	iface = self.iface_byregnumber
255	converter = IObjectConverter(iface)
256	errs, inv_errs, conv_dict = converter.fromStringDict(
257	row, self.factory_name, mode=mode)
258	if 'transition' in row:
259	if row['transition'] not in IMPORTABLE_REGISTRATION_TRANSITIONS:
260	if row['transition'] not in (IGNORE_MARKER, ''):
261	errs.append(('transition', 'not allowed'))
262	if 'state' in row:
263	if row['state'] not in IMPORTABLE_REGISTRATION_STATES:
264	if row['state'] not in (IGNORE_MARKER, ''):
265	errs.append(('state', 'not allowed'))
266	else:
267	# State is an attribute of Customer and must not
268	# be changed if empty.
269	conv_dict['state'] = IGNORE_MARKER
270	try:
271	# Correct cust_id counter. As the IConverter for customers
272	# creates customer objects that are not used afterwards, we
273	# have to fix the site-wide customer_id counter.
274	site = grok.getSite()
275	customers = site['customers']
276	customers._curr_cust_id -= 1
277	except (KeyError, TypeError, AttributeError):
278	pass
279	return errs, inv_errs, conv_dict
280
281
282	class CustomerProcessorBase(BatchProcessor):
283	"""A base for customer subitem processors.
284
285	Helps reducing redundancy.
286	"""
287	grok.baseclass()
288
289	# additional available fields
290	# beside 'customer_id', 'reg_number' and 'matric_number'
291	additional_fields = []
292
293	#: header fields additionally required
294	additional_headers = []
295
296	@property
297	def available_fields(self):
298	fields = ['customer_id', 'reg_number'] + self.additional_fields
299	return sorted(list(set(fields + getFields(
300	self.iface).keys())))
301
302	def checkHeaders(self, headerfields, mode='ignore'):
303	if not 'reg_number' in headerfields and not 'customer_id' \
304	in headerfields:
305	raise FatalCSVError(
306	"Need at least columns customer_id " +
307	"or reg_number for import!")
308	for name in self.additional_headers:
309	if not name in headerfields:
310	raise FatalCSVError(
311	"Need %s for import!" % name)
312
313	# Check for fields to be ignored...
314	not_ignored_fields = [x for x in headerfields
315	if not x.startswith('--')]
316	if len(set(not_ignored_fields)) < len(not_ignored_fields):
317	raise FatalCSVError(
318	"Double headers: each column name may only appear once.")
319	return True
320
321	def _getCustomer(self, row, site):
322	NON_VALUES = ['', IGNORE_MARKER]
323	if not 'customers' in site.keys():
324	return None
325	if row.get('customer_id', '') not in NON_VALUES:
326	if row['customer_id'] in site['customers']:
327	customer = site['customers'][row['customer_id']]
328	return customer
329	elif row.get('reg_number', '') not in NON_VALUES:
330	reg_number = row['reg_number']
331	cat = queryUtility(ICatalog, name='customers_catalog')
332	results = list(
333	cat.searchResults(reg_number=(reg_number, reg_number)))
334	if results:
335	return results[0]
336	return None
337
338	def parentsExist(self, row, site):
339	return self.getParent(row, site) is not None
340
341	def entryExists(self, row, site):
342	return self.getEntry(row, site) is not None
343
344	def checkConversion(self, row, mode='ignore'):
345	"""Validates all values in row.
346	"""
347	converter = IObjectConverter(self.iface)
348	errs, inv_errs, conv_dict = converter.fromStringDict(
349	row, self.factory_name, mode=mode)
350	return errs, inv_errs, conv_dict
351
352	def getMapping(self, path, headerfields, mode):
353	"""Get a mapping from CSV file headerfields to actually used fieldnames.
354	"""
355	result = dict()
356	reader = csv.reader(open(path, 'rb'))
357	raw_header = reader.next()
358	for num, field in enumerate(headerfields):
359	if field not in ['customer_id', 'reg_number', 'document_id',
360	'code', 'level', 'contract_id'
361	] and mode == 'remove':
362	continue
363	if field == u'--IGNORE--':
364	# Skip ignored columns in failed and finished data files.
365	continue
366	result[raw_header[num]] = field
367	return result
368
369	class CustomerDocumentProcessor(CustomerProcessorBase):
370	"""A batch processor for ICustomerDocument objects.
371	"""
372	grok.implements(IBatchProcessor)
373	grok.provides(IBatchProcessor)
374	grok.context(Interface)
375	util_name = 'customerdocumentprocessor'
376	grok.name(util_name)
377
378	name = _('CustomerDocument Processor')
379	iface = ICustomerDocument
380	factory_name = 'waeup.CustomerSampleDocument'
381
382	location_fields = []
383	additional_fields = ['document_id', 'class_name']
384	additional_headers = ['class_name']
385
386	def checkHeaders(self, headerfields, mode='ignore'):
387	super(CustomerDocumentProcessor, self).checkHeaders(headerfields)
388	if mode in ('update', 'remove') and not 'document_id' in headerfields:
389	raise FatalCSVError(
390	"Need document_id for import in update and remove modes!")
391	return True
392
393	def getParent(self, row, site):
394	customer = self._getCustomer(row, site)
395	if customer is None:
396	return None
397	return customer['documents']
398
399	def getEntry(self, row, site):
400	documents = self.getParent(row, site)
401	if documents is None:
402	return None
403	document_id = row.get('document_id', None)
404	if document_id is None:
405	return None
406	entry = documents.get(document_id)
407	return entry
408
409	def updateEntry(self, obj, row, site, filename):
410	"""Update obj to the values given in row.
411	"""
412	items_changed = super(CustomerDocumentProcessor, self).updateEntry(
413	obj, row, site, filename)
414	customer = self.getParent(row, site).__parent__
415	customer.__parent__.logger.info(
416	'%s - %s - %s - updated: %s'
417	% (self.name, filename, customer.customer_id, items_changed))
418	return
419
420	def addEntry(self, obj, row, site):
421	parent = self.getParent(row, site)
422	document_id = row['document_id'].strip('#')
423	parent[document_id] = obj
424	return
425
426	def delEntry(self, row, site):
427	document = self.getEntry(row, site)
428	parent = self.getParent(row, site)
429	if document is not None:
430	customer = self._getCustomer(row, site)
431	customer.__parent__.logger.info('%s - Document removed: %s'
432	% (customer.customer_id, document.document_id))
433	del parent[document.document_id]
434	return
435
436	def checkConversion(self, row, mode='ignore'):
437	"""Validates all values in row.
438	"""
439	errs, inv_errs, conv_dict = super(
440	CustomerDocumentProcessor, self).checkConversion(row, mode=mode)
441	# We need to check if the class_name corresponds with the
442	# processor chosen. This is to avoid accidentally wrong imports.
443	if mode != 'remove':
444	class_name = row.get('class_name', None)
445	if class_name != self.factory_name.strip('waeup.'):
446	errs.append(('class_name','wrong processor'))
447	# We have to check document_id.
448	document_id = row.get('document_id', None)
449	if mode == 'create':
450	if not document_id:
451	document_id = generate_document_id()
452	conv_dict['document_id'] = document_id
453	return errs, inv_errs, conv_dict
454	cat = queryUtility(ICatalog, name='documents_catalog')
455	results = list(
456	cat.searchResults(document_id=(document_id, document_id)))
457	if results:
458	# document_id must not exist.
459	errs.append(('document_id','id exists'))
460	else:
461	if not document_id.startswith('d'):
462	errs.append(('document_id','invalid format'))
463	return errs, inv_errs, conv_dict
464
465
466	class ContractProcessor(CustomerProcessorBase):
467	"""A batch processor for IContract objects.
468	"""
469	grok.implements(IBatchProcessor)
470	grok.provides(IBatchProcessor)
471	grok.context(Interface)
472	util_name = 'contractprocessor'
473	grok.name(util_name)
474
475	name = _('Contract Processor')
476	iface = ISampleContract
477	factory_name = 'waeup.SampleContract'
478
479	location_fields = []
480	additional_fields = ['contract_id', 'class_name']
481	additional_headers = ['class_name']
482
483	def checkHeaders(self, headerfields, mode='ignore'):
484	super(ContractProcessor, self).checkHeaders(headerfields)
485	if mode in ('update', 'remove') and not 'contract_id' in headerfields:
486	raise FatalCSVError(
487	"Need contract_id for import in update and remove modes!")
488	return True
489
490	def getParent(self, row, site):
491	customer = self._getCustomer(row, site)
492	if customer is None:
493	return None
494	return customer['contracts']
495
496	def getEntry(self, row, site):
497	contracts = self.getParent(row, site)
498	if contracts is None:
499	return None
500	contract_id = row.get('contract_id', None)
501	if contract_id is None:
502	return None
503	entry = contracts.get(contract_id)
504	return entry
505
506	def updateEntry(self, obj, row, site, filename):
507	"""Update obj to the values given in row.
508	"""
509	items_changed = super(ContractProcessor, self).updateEntry(
510	obj, row, site, filename)
511	customer = self.getParent(row, site).__parent__
512	customer.__parent__.logger.info(
513	'%s - %s - %s - updated: %s'
514	% (self.name, filename, customer.customer_id, items_changed))
515	return
516
517	def addEntry(self, obj, row, site):
518	parent = self.getParent(row, site)
519	contract_id = row['contract_id'].strip('#')
520	parent[contract_id] = obj
521	return
522
523	def delEntry(self, row, site):
524	contract = self.getEntry(row, site)
525	parent = self.getParent(row, site)
526	if contract is not None:
527	customer = self._getCustomer(row, site)
528	customer.__parent__.logger.info('%s - Contract removed: %s'
529	% (customer.customer_id, contract.contract_id))
530	del parent[contract.contract_id]
531	return
532
533	def checkConversion(self, row, mode='ignore'):
534	"""Validates all values in row.
535	"""
536	errs, inv_errs, conv_dict = super(
537	ContractProcessor, self).checkConversion(row, mode=mode)
538	# We need to check if the class_name corresponds with the
539	# processor chosen. This is to avoid accidentally wrong imports.
540	if mode != 'remove':
541	class_name = row.get('class_name', None)
542	if class_name != self.factory_name.strip('waeup.'):
543	errs.append(('class_name','wrong processor'))
544	# We have to check contract_id.
545	contract_id = row.get('contract_id', None)
546	if mode == 'create':
547	if not contract_id:
548	contract_id = generate_contract_id()
549	conv_dict['contract_id'] = contract_id
550	return errs, inv_errs, conv_dict
551	cat = queryUtility(ICatalog, name='contracts_catalog')
552	results = list(
553	cat.searchResults(contract_id=(contract_id, contract_id)))
554	if results:
555	# contract_id must not exist.
556	errs.append(('contract_id','id exists'))
557	else:
558	if not contract_id.startswith('c'):
559	errs.append(('contract_id','invalid format'))
560	return errs, inv_errs, conv_dict

Note: See TracBrowser for help on using the repository browser.

Download in other formats: