Source code for waeup.kofa.applicants.batching

## $Id: batching.py 17787 2024-05-15 06:42:58Z henrik $
##
## Copyright (C) 2011 Uli Fouquet & Henrik Bettermann
## This program is free software; you can redistribute it and/or modify
## it under the terms of the GNU General Public License as published by
## the Free Software Foundation; either version 2 of the License, or
## (at your option) any later version.
##
## This program is distributed in the hope that it will be useful,
## but WITHOUT ANY WARRANTY; without even the implied warranty of
## MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
## GNU General Public License for more details.
##
## You should have received a copy of the GNU General Public License
## along with this program; if not, write to the Free Software
## Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
##
"""Batch processing for applicants.
"""
import unicodecsv as csv # XXX: csv ops should move to dedicated module.
import grok
from time import time
from ast import literal_eval
import unicodecsv
from zope.schema import getFields
from zope.interface import Interface
from zope.component import queryUtility, getUtility
from hurry.workflow.interfaces import IWorkflowState
from zope.catalog.interfaces import ICatalog
from waeup.kofa.interfaces import (
    IBatchProcessor, IObjectConverter, FatalCSVError,
    IGNORE_MARKER, DELETION_MARKER,
    IObjectHistory, IUserAccount, DuplicationError)
from waeup.kofa.interfaces import MessageFactory as _
from waeup.kofa.payments.interfaces import IPayer
from waeup.kofa.utils.batching import BatchProcessor
from waeup.kofa.applicants.interfaces import (
    IApplicantsContainer, IApplicant, IApplicantUpdateByRegNo,
    IApplicantOnlinePayment, IApplicantRefereeReport)
from waeup.kofa.applicants.workflow import  IMPORTABLE_STATES, CREATED

class ApplicantsContainerProcessor(BatchProcessor):
    """Batch processor for applicants containers.

    Only the containers themselves are imported, never the applicants
    stored inside them. Containers live in ``site['applicants']`` and are
    keyed by the ``code`` column of the import row.
    """
    grok.implements(IBatchProcessor)
    grok.provides(IBatchProcessor)
    grok.context(Interface)
    util_name = 'applicantscontainerprocessor'
    grok.name(util_name)

    name = _('ApplicantsContainer Processor')
    mode = u'create'
    iface = IApplicantsContainer

    # Column(s) used to locate a container.
    location_fields = ['code',]
    factory_name = 'waeup.ApplicantsContainer'

    def parentsExist(self, row, site):
        """Tell whether the site provides an ``applicants`` root."""
        return 'applicants' in site.keys()

    def entryExists(self, row, site):
        """Tell whether a container with the row's ``code`` exists."""
        existing_codes = site['applicants'].keys()
        return row['code'] in existing_codes

    def getParent(self, row, site):
        """Return the applicants root holding all containers."""
        return site['applicants']

    def getEntry(self, row, site):
        """Return the container addressed by `row` or ``None``."""
        if self.entryExists(row, site):
            applicants_root = self.getParent(row, site)
            return applicants_root.get(row['code'])
        return None

    def addEntry(self, obj, row, site):
        """Store `obj` in the applicants root under the row's ``code``."""
        applicants_root = self.getParent(row, site)
        applicants_root[row['code']] = obj

    def delEntry(self, row, site):
        """Remove the container addressed by the row's ``code``."""
        applicants_root = self.getParent(row, site)
        del applicants_root[row['code']]


class ApplicantProcessor(BatchProcessor):
    """The Applicant Processor imports application data (applicants).

    In create mode `container_code` is required. If `application_number`
    is given, an applicant with this number is created in the designated
    container. If `application_number` is not given, a random
    `application_number` is assigned. `applicant_id` is being determined
    by the system and can't be imported.

    In update or remove mode `container_code` and `application_number`
    columns must not exist. The applicant object is solely localized by
    searching the applicants catalog for `reg_number` or `applicant_id`.
    """
    grok.implements(IBatchProcessor)
    grok.provides(IBatchProcessor)
    grok.context(Interface)
    util_name = 'applicantprocessor'
    grok.name(util_name)
    name = _('Applicant Processor')
    iface = IApplicant
    # Interface used for conversion when the row is located by
    # reg_number or when rows are removed (see checkConversion).
    iface_byregnumber = IApplicantUpdateByRegNo
    factory_name = 'waeup.Applicant'

    @property
    def available_fields(self):
        """Sorted list of all column names this processor accepts."""
        return sorted(list(set(
            ['application_number', 'history',
             'container_code', 'state', 'password'] + getFields(
                self.iface).keys())))

    def checkHeaders(self, headerfields, mode='create'):
        """Validate the header row of an import file.

        Raises `FatalCSVError` if columns required for `mode` are
        missing, if columns forbidden in `mode` are present or if a
        (not ignored) column name occurs more than once. Returns
        ``True`` otherwise.
        """
        has_container = 'container_code' in headerfields
        has_app_number = 'application_number' in headerfields
        has_applicant_id = 'applicant_id' in headerfields
        has_reg_number = 'reg_number' in headerfields
        if mode == 'create':
            if not has_container:
                raise FatalCSVError(
                    "Need at least container_code column!")
            if has_applicant_id:
                raise FatalCSVError(
                    "applicant_id can't be imported in create mode!")
            for field in self.required_fields:
                if not field in headerfields:
                    raise FatalCSVError(
                        "Need at least columns %s for import!" %
                        ', '.join(["'%s'" % x for x in self.required_fields]))
        if mode in ('update', 'remove'):
            if not has_applicant_id and not has_reg_number:
                raise FatalCSVError(
                    "Need at least column reg_number or applicant_id!")
            if has_container or has_app_number:
                raise FatalCSVError(
                    "container_code or application_number can't be imported " +
                    "in update or remove mode!")
        # Columns whose name starts with '--' are ignored and may
        # therefore appear several times.
        not_ignored_fields = [x for x in headerfields
                              if not x.startswith('--')]
        if len(set(not_ignored_fields)) < len(not_ignored_fields):
            raise FatalCSVError(
                "Double headers: each column name may only appear once.")
        return True

    # Backward-compatible alias for the former, misspelled method name.
    cheadminckHeaders = checkHeaders

    def getLocator(self, row):
        """Return the name of the column that locates the applicant.

        The first of `container_code`, `applicant_id` and `reg_number`
        that carries a real value (neither missing nor the ignore
        marker) wins. Returns ``None`` if none of them is usable.
        """
        # container_code means create mode, the others update/remove.
        for column in ('container_code', 'applicant_id', 'reg_number'):
            if row.get(column, None) not in (IGNORE_MARKER, None):
                return column
        return None

    def _searchApplicant(self, field, value):
        """Return the first applicants catalog hit for `field` == `value`.

        Returns ``None`` if the catalog does not yield any result.
        """
        cat = queryUtility(ICatalog, name='applicants_catalog')
        results = list(cat.searchResults(**{field: (value, value)}))
        if results:
            return results[0]
        return None

    def getParent(self, row, site):
        """Return the applicants container belonging to `row` or ``None``.

        In create mode the container is looked up by `container_code`,
        otherwise it is the parent of the applicant found in the
        catalog.
        """
        locator = self.getLocator(row)
        if locator == 'container_code':
            return site['applicants'].get(row['container_code'], None)
        if locator in ('reg_number', 'applicant_id'):
            applicant = self._searchApplicant(locator, row[locator])
            if applicant is not None:
                return applicant.__parent__
        return None

    def parentsExist(self, row, site):
        """Tell whether a container for `row` can be found."""
        return self.getParent(row, site) is not None

    def getEntry(self, row, site):
        """Return the applicant addressed by `row` or ``None``."""
        locator = self.getLocator(row)
        if locator == 'container_code':
            # Create mode: an applicant can only exist already if an
            # application_number was given.
            if row.get('application_number', None) in (IGNORE_MARKER, None):
                return None
            parent = self.getParent(row, site)
            if parent is None:
                return None
            return parent.get(row['application_number'])
        if locator in ('applicant_id', 'reg_number'):
            return self._searchApplicant(locator, row[locator])
        return None

    def entryExists(self, row, site):
        """Tell whether the applicant addressed by `row` exists."""
        return self.getEntry(row, site) is not None

    def addEntry(self, obj, row, site):
        """Add applicant `obj` to its container and note it in history."""
        parent = self.getParent(row, site)
        parent.addApplicant(obj)
        history = IObjectHistory(obj)
        history.addMessage(_('Application record imported'))
        return

    def delEntry(self, row, site):
        """Remove the applicant addressed by `row`, if there is one."""
        applicant = self.getEntry(row, site)
        if applicant is not None:
            parent = applicant.__parent__
            del parent[applicant.application_number]

    def updateEntry(self, obj, row, site, filename):
        """Update obj to the values given in row.

        `application_number`, `password`, `history` and `state` are
        handled here and removed from `row`; the remaining values are
        applied by the base class. The changes are written to the
        logger of the applicants root and returned as a string.
        """
        items_changed = ''

        # Remove application_number from row if empty
        if 'application_number' in row and row['application_number'] in (
            None, IGNORE_MARKER):
            row.pop('application_number')

        # Update applicant_id from application_number and container code
        # if application_number is given
        if 'application_number' in row:
            obj.applicant_id = u'%s_%s' % (
                row['container_code'], row['application_number'])
            items_changed += ('%s=%s, ' % ('applicant_id', obj.applicant_id))
            row.pop('application_number')

        # Update password
        if 'password' in row:
            passwd = row.get('password', IGNORE_MARKER)
            if passwd not in ('', IGNORE_MARKER):
                if passwd.startswith('{SSHA}'):
                    # already encrypted password
                    obj.password = passwd
                elif passwd == DELETION_MARKER:
                    obj.password = None
                else:
                    # not yet encrypted password
                    IUserAccount(obj).setPassword(passwd)
                # NOTE(review): the password value, possibly in plain
                # text, ends up in the import log via items_changed --
                # confirm that this is intended.
                items_changed += ('%s=%s, ' % ('password', passwd))
            row.pop('password')

        # Replace entire history
        if 'history' in row:
            new_history = row.get('history', IGNORE_MARKER)
            if new_history not in (IGNORE_MARKER, ''):
                history = IObjectHistory(obj)
                history._annotations[
                    history.history_key] = literal_eval(new_history)
                items_changed += ('%s=%s, ' % ('history', new_history))
            row.pop('history')

        # Update registration state
        if 'state' in row:
            state = row.get('state', IGNORE_MARKER)
            if state not in (IGNORE_MARKER, ''):
                IWorkflowState(obj).setState(state)
                msg = _("State '${a}' set", mapping = {'a':state})
                history = IObjectHistory(obj)
                history.addMessage(msg)
                items_changed += ('%s=%s, ' % ('state', state))
            row.pop('state')

        # apply other values...
        items_changed += super(ApplicantProcessor, self).updateEntry(
            obj, row, site, filename)

        # Log actions...
        parent = self.getParent(row, site)
        if self.getLocator(row) == 'container_code':
            # Rows located by container_code stem from create mode.
            parent.__parent__.logger.info(
                '%s - %s - imported: %s'
                % (self.name, filename, items_changed))
        else:
            parent.__parent__.logger.info(
                '%s - %s - updated: %s'
                % (self.name, filename, items_changed))
        return items_changed

    def getMapping(self, path, headerfields, mode):
        """Get a mapping from CSV file headerfields to actually
        used fieldnames.

        In remove mode only the locator columns `applicant_id` and
        `reg_number` are mapped. Columns marked ``--IGNORE--`` are
        always skipped.
        """
        result = dict()
        # Only the header row is needed; close the file right after.
        with open(path, 'rb') as csv_file:
            raw_header = next(csv.reader(csv_file))
        for num, field in enumerate(headerfields):
            if field not in ['applicant_id', 'reg_number'] and mode == 'remove':
                continue
            if field == u'--IGNORE--':
                # Skip ignored columns in failed and finished data files.
                continue
            result[raw_header[num]] = field
        return result

    def checkConversion(self, row, mode='create'):
        """Validates all values in row.

        Returns a tuple ``(errs, inv_errs, conv_dict)`` as delivered by
        the object converter, extended by checks of `course1`, `state`
        and `application_number`.
        """
        iface = self.iface
        if self.getLocator(row) == 'reg_number' or mode == 'remove':
            iface = self.iface_byregnumber
        converter = IObjectConverter(iface)
        errs, inv_errs, conv_dict = converter.fromStringDict(
            row, self.factory_name, mode=mode)
        cert = conv_dict.get('course1', None)
        if cert is not None and (mode in ('create', 'update')):
            # course1 application category must match container's.
            site = grok.getSite()
            parent = self.getParent(row, site)
            if parent is None:
                errs.append(('container', 'not found'))
            elif cert.application_category != parent.application_category:
                errs.append(('course1', 'wrong application category'))
        if 'state' in row and row['state'] not in IMPORTABLE_STATES:
            if row['state'] not in (IGNORE_MARKER, ''):
                errs.append(('state','not allowed'))
            else:
                # state is an attribute of Applicant and must not
                # be changed if empty
                conv_dict['state'] = IGNORE_MARKER
        application_number = row.get('application_number', None)
        if application_number in (IGNORE_MARKER, ''):
            conv_dict['application_number'] = IGNORE_MARKER
        return errs, inv_errs, conv_dict

    def checkUpdateRequirements(self, obj, row, site):
        """Checks requirements the object must fulfill when being updated.

        This method is not used in case of deleting or adding objects.

        Returns error messages as strings in case of requirement
        problems.
        """
        # Block applicant with backdoor ...
        if obj.state == CREATED and obj.notice != 'reset':
            return 'Applicant is blocked.'
        return None


class ApplicantOnlinePaymentProcessor(BatchProcessor):
    """The Applicant Online Payment Processor imports applicant payment
    tickets. The tickets are located in the applicant container.

    The `checkConversion` method checks the format of the payment
    identifier. In create mode it also ensures that the same p_id does
    not exist elsewhere. It must be portal-wide unique.

    When adding a payment ticket, the `addEntry` method checks if a
    payment has already been made. If so, a `DuplicationError` is raised.
    """
    grok.implements(IBatchProcessor)
    grok.provides(IBatchProcessor)
    grok.context(Interface)
    util_name = 'applicantpaymentprocessor'
    grok.name(util_name)

    name = _('ApplicantOnlinePayment Processor')
    iface = IApplicantOnlinePayment
    factory_name = 'waeup.ApplicantOnlinePayment'

    # Column(s) used to locate the applicant owning the ticket.
    location_fields = ['applicant_id',]

    @property
    def available_fields(self):
        """Accepted column names: sorted fields followed by ``p_id``,
        without ``display_item``.
        """
        af = sorted(list(set(
            self.location_fields + getFields(self.iface).keys())) +
            ['p_id',])
        af.remove('display_item')
        return af

    def checkHeaders(self, headerfields, mode='ignore'):
        """Validate the header row of an import file.

        On top of the base class checks, `p_id` is demanded in update
        and remove mode. Raises `FatalCSVError` if it is missing,
        returns ``True`` otherwise.
        """
        super(ApplicantOnlinePaymentProcessor, self).checkHeaders(headerfields)
        if mode in ('update', 'remove') and not 'p_id' in headerfields:
            raise FatalCSVError(
                "Need p_id for import in update and remove modes!")
        return True

    def getMapping(self, path, headerfields, mode):
        """Get a mapping from CSV file headerfields to actually
        used fieldnames.

        In remove mode only `applicant_id` and `p_id` are mapped.
        Columns marked ``--IGNORE--`` are always skipped.
        """
        result = dict()
        # Only the header row is needed; close the file right after.
        with open(path, 'rb') as csv_file:
            raw_header = next(unicodecsv.reader(csv_file))
        for num, field in enumerate(headerfields):
            if field not in ['applicant_id', 'p_id'] and mode == 'remove':
                continue
            if field == u'--IGNORE--':
                continue
            result[raw_header[num]] = field
        return result

    def parentsExist(self, row, site):
        """Tell whether the applicant addressed by `row` exists."""
        return self.getParent(row, site) is not None

    def getParent(self, row, site):
        """Return the applicant with the row's `applicant_id` or ``None``.

        The applicant is looked up in the applicants catalog.
        """
        applicant_id = row['applicant_id']
        cat = queryUtility(ICatalog, name='applicants_catalog')
        results = list(
            cat.searchResults(applicant_id=(applicant_id, applicant_id)))
        if results:
            return results[0]
        return None

    def getEntry(self, row, site):
        """Return the payment ticket addressed by `row` or ``None``."""
        applicant = self.getParent(row, site)
        if applicant is None:
            return None
        p_id = row.get('p_id', None)
        if p_id in (None, IGNORE_MARKER):
            return None
        # We can use the hash symbol at the end of p_id in import files
        # to avoid annoying automatic number transformation
        # by Excel or Calc
        p_id = p_id.strip('#')
        return applicant.get(p_id)

    def entryExists(self, row, site):
        """Tell whether the payment ticket addressed by `row` exists."""
        return self.getEntry(row, site) is not None

    def updateEntry(self, obj, row, site, filename):
        """Update obj to the values given in row.

        The values are applied by the base class; the changes are then
        written to the logger of the applicants root.
        """
        items_changed = super(ApplicantOnlinePaymentProcessor, self).updateEntry(
            obj, row, site, filename)
        applicant = self.getParent(row, site)
        applicant.__parent__.__parent__.logger.info(
            '%s - %s - %s - updated: %s'
            % (self.name, filename, applicant.applicant_id, items_changed))
        return

    def samePaymentMade(self, applicant, category):
        """Tell whether `applicant` holds a paid ticket of `category`."""
        return any(
            applicant[key].p_state == 'paid'
            and applicant[key].p_category == category
            for key in applicant.keys())

    def addEntry(self, obj, row, site):
        """Add payment ticket `obj` to the applicant addressed by `row`.

        Raises `DuplicationError` if a ticket of the same category has
        been paid already. Tickets whose `p_item` starts with
        ``Balance`` are exempt from this check.
        """
        applicant = self.getParent(row, site)
        p_id = row['p_id'].strip('#')
        is_balance = obj.p_item and obj.p_item.startswith('Balance')
        if not is_balance and self.samePaymentMade(applicant, obj.p_category):
            applicant.__parent__.__parent__.logger.info(
                '%s - %s - previous update cancelled'
                % (self.name, applicant.applicant_id))
            raise DuplicationError('Payment has already been made.')
        applicant[p_id] = obj
        return

    def delEntry(self, row, site):
        """Remove the payment ticket addressed by `row`, if there is one,
        and log the removal.
        """
        payment = self.getEntry(row, site)
        applicant = self.getParent(row, site)
        if payment is not None:
            applicant.__parent__.__parent__.logger.info(
                '%s - Payment ticket removed: %s'
                % (applicant.applicant_id, payment.p_id))
            del applicant[payment.p_id]
        return

    def checkConversion(self, row, mode='ignore'):
        """Validates all values in row.

        Besides the base class checks the payment id is examined: in
        create mode a missing `p_id` is generated from the current
        time, in other modes a missing `p_id` is an error. A given
        `p_id` must be 14 characters long (surrounding ``#`` stripped)
        and, in create mode, must not be found in the payments catalog.

        Returns a tuple ``(errs, inv_errs, conv_dict)``.
        """
        errs, inv_errs, conv_dict = super(
            ApplicantOnlinePaymentProcessor, self).checkConversion(row, mode=mode)

        # We have to check p_id.
        p_id = row.get('p_id', None)
        if p_id in (None, IGNORE_MARKER):
            if mode == 'create':
                # No id given: derive one from the current time.
                timestamp = ("%d" % int(time()*10000))[1:]
                conv_dict['p_id'] = "p%s" % timestamp
            else:
                errs.append(('p_id','missing'))
            return errs, inv_errs, conv_dict

        p_id = p_id.strip('#')
        if not len(p_id) == 14:
            errs.append(('p_id','invalid length'))
            return errs, inv_errs, conv_dict
        if mode == 'create':
            # p_id must be portal-wide unique.
            cat = getUtility(ICatalog, name='payments_catalog')
            results = list(cat.searchResults(p_id=(p_id, p_id)))
            if results:
                # Each payer id is followed by a blank, as before.
                sids_string = ''.join(
                    ['%s ' % IPayer(payment).id for payment in results])
                errs.append(('p_id','p_id exists in %s' % sids_string))
        return errs, inv_errs, conv_dict


class ApplicantRefereeReportProcessor(BatchProcessor):
    """Batch processor for applicant referee reports.

    A report is stored inside the applicant it belongs to. The applicant
    is found via the ``applicant_id`` column, the report itself via the
    ``r_id`` column.
    """
    grok.implements(IBatchProcessor)
    grok.provides(IBatchProcessor)
    grok.context(Interface)
    util_name = 'applicantrefereereportprocessor'
    grok.name(util_name)

    name = _('ApplicantRefereeReport Processor')
    iface = IApplicantRefereeReport
    factory_name = 'waeup.ApplicantRefereeReport'

    # Column(s) used to locate the applicant owning the report.
    location_fields = ['applicant_id',]

    @property
    def available_fields(self):
        """Sorted list of all column names this processor accepts."""
        extra_columns = ['r_id', 'email', 'applicant_id']
        schema_columns = getFields(self.iface).keys()
        return sorted(list(set(extra_columns + schema_columns)))

    def parentsExist(self, row, site):
        """Tell whether the applicant addressed by `row` exists."""
        owner = self.getParent(row, site)
        return owner is not None

    def getParent(self, row, site):
        """Return the applicant with the row's ``applicant_id`` or ``None``.

        The applicant is looked up in the applicants catalog.
        """
        wanted = row['applicant_id']
        catalog = queryUtility(ICatalog, name='applicants_catalog')
        hits = list(catalog.searchResults(applicant_id=(wanted, wanted)))
        if not hits:
            return None
        return hits[0]

    def getEntry(self, row, site):
        """Return the referee report addressed by `row` or ``None``."""
        owner = self.getParent(row, site)
        if owner is not None:
            return owner.get(row['r_id'])
        return None

    def entryExists(self, row, site):
        """Tell whether the referee report addressed by `row` exists."""
        report = self.getEntry(row, site)
        return report is not None

    def updateEntry(self, obj, row, site, filename):
        """Apply the values of `row` to `obj` and log the changes.

        The values are applied by the base class; the log record goes
        to the logger of the applicants root.
        """
        changes = super(ApplicantRefereeReportProcessor, self).updateEntry(
            obj, row, site, filename)
        owner = self.getParent(row, site)
        logger = owner.__parent__.__parent__.logger
        logger.info(
            '%s - %s - %s - updated: %s'
            % (self.name, filename, owner.applicant_id, changes))

    def addEntry(self, obj, row, site):
        """Store report `obj` in its applicant under the row's ``r_id``."""
        owner = self.getParent(row, site)
        owner[row['r_id']] = obj

    def delEntry(self, row, site):
        """Remove the report addressed by `row`, if there is one, and
        log the removal.
        """
        report = self.getEntry(row, site)
        owner = self.getParent(row, site)
        if report is None:
            return
        owner.__parent__.__parent__.logger.info(
            '%s - Referee Report removed' % report.r_id)
        del owner[report.r_id]