226 lines
8.8 KiB
Python
226 lines
8.8 KiB
Python
# -*- coding: utf-8 -*-
|
|
"""
|
|
Mexican-specific form helpers.
|
|
"""
|
|
import re
|
|
|
|
from django.forms import ValidationError
|
|
from django.forms.fields import Select, RegexField
|
|
from django.utils.translation import ugettext_lazy as _
|
|
from django.core.validators import EMPTY_VALUES
|
|
from django.contrib.localflavor.mx.mx_states import STATE_CHOICES
|
|
|
|
# Regex fragment for a YYMMDD date: a two-digit year followed by a month/day
# pair whose day is valid for that month (February is allowed up to the 29th).
DATE_RE = (
    r'\d{2}('
    r'(01|03|05|07|08|10|12)(0[1-9]|[12]\d|3[01])|'  # months with 31 days
    r'02(0[1-9]|[12]\d)|'                            # February
    r'(04|06|09|11)(0[1-9]|[12]\d|30)'               # months with 30 days
    r')'
)
|
|
|
|
"""
|
|
This is the list of inconvenient words according to the `Anexo IV` of the
|
|
document described in the next link:
|
|
http://www.sisi.org.mx/jspsi/documentos/2005/seguimiento/06101/0610100162005_065.doc
|
|
"""
|
|
|
|
# Four-letter prefixes that MXRFCField rejects at the start of an RFC.
# Entries are kept in their original order, one row per initial letter group.
RFC_INCONVENIENT_WORDS = [
    u'BUEI', u'BUEY',
    u'CACA', u'CACO', u'CAGA', u'CAGO', u'CAKA', u'CAKO', u'COGE', u'COJA',
    u'COJE', u'COJI', u'COJO', u'CULO',
    u'FETO', u'GUEY', u'JOTO',
    u'KACA', u'KACO', u'KAGA', u'KAGO', u'KOGE', u'KOJO', u'KAKA', u'KULO',
    u'MAME', u'MAMO', u'MEAR', u'MEAS', u'MEON', u'MION', u'MOCO', u'MULA',
    u'PEDA', u'PEDO', u'PENE', u'PUTA', u'PUTO',
    u'QULO', u'RATA', u'RUIN',
]
|
|
|
|
"""
|
|
This is the list of inconvenient words according to the `Anexo 2` of the
|
|
document described in the next link:
|
|
http://portal.veracruz.gob.mx/pls/portal/url/ITEM/444112558A57C6E0E040A8C02E00695C
|
|
"""
|
|
# Four-letter prefixes that MXCURPField rejects at the start of a CURP.
# Entries are kept in their original order, one row per initial letter group.
CURP_INCONVENIENT_WORDS = [
    u'BACA', u'BAKA', u'BUEI', u'BUEY',
    u'CACA', u'CACO', u'CAGA', u'CAGO', u'CAKA', u'CAKO', u'COGE', u'COGI',
    u'COJA', u'COJE', u'COJI', u'COJO', u'COLA', u'CULO',
    u'FALO', u'FETO',
    u'GETA', u'GUEI', u'GUEY',
    u'JETA', u'JOTO',
    u'KACA', u'KACO', u'KAGA', u'KAGO', u'KAKA', u'KAKO', u'KOGE', u'KOGI',
    u'KOJA', u'KOJE', u'KOJI', u'KOJO', u'KOLA', u'KULO',
    u'LILO', u'LOCA', u'LOCO', u'LOKA', u'LOKO',
    u'MAME', u'MAMO', u'MEAR', u'MEAS', u'MEON', u'MIAR', u'MION', u'MOCO',
    u'MOKO', u'MULA', u'MULO',
    u'NACA', u'NACO',
    u'PEDA', u'PEDO', u'PENE', u'PIPI', u'PITO', u'POPO', u'PUTA', u'PUTO',
    u'QULO',
    u'RATA', u'ROBA', u'ROBE', u'ROBO', u'RUIN',
    u'SENO', u'TETA',
    u'VACA', u'VAGA', u'VAGO', u'VAKA', u'VUEI', u'VUEY',
    u'WUEI', u'WUEY',
]
|
|
|
|
class MXStateSelect(Select):
    """
    Select widget whose options are the Mexican states.

    The choices come from ``STATE_CHOICES``; ``attrs`` is forwarded to the
    underlying ``Select`` unchanged.
    """

    def __init__(self, attrs=None):
        super(MXStateSelect, self).__init__(attrs=attrs,
                                            choices=STATE_CHOICES)
|
|
|
|
|
|
class MXZipCodeField(RegexField):
|
|
"""
|
|
A form field that accepts a Mexican Zip Code.
|
|
|
|
More info about this:
|
|
http://en.wikipedia.org/wiki/List_of_postal_codes_in_Mexico
|
|
"""
|
|
default_error_messages = {
|
|
'invalid': _(u'Enter a valid zip code in the format XXXXX.'),
|
|
}
|
|
|
|
def __init__(self, *args, **kwargs):
|
|
zip_code_re = ur'^(0[1-9]|[1][0-6]|[2-9]\d)(\d{3})$'
|
|
super(MXZipCodeField, self).__init__(zip_code_re, *args, **kwargs)
|
|
|
|
|
|
class MXRFCField(RegexField):
|
|
"""
|
|
A form field that validates a Mexican *Registro Federal de Contribuyentes*
|
|
for either `Persona física` or `Persona moral`.
|
|
|
|
The Persona física RFC string is integrated by a juxtaposition of
|
|
characters following the next pattern:
|
|
|
|
===== ====== ===========================================
|
|
Index Format Accepted Characters
|
|
===== ====== ===========================================
|
|
1 X Any letter
|
|
2 X Any vowel
|
|
3-4 XX Any letter
|
|
5-10 YYMMDD Any valid date
|
|
11-12 XX Any letter or number between 0 and 9
|
|
13 X Any digit between 0 and 9 or the letter *A*
|
|
===== ====== ===========================================
|
|
|
|
The Persona moral RFC string is integrated by a juxtaposition of
|
|
characters following the next pattern:
|
|
|
|
===== ====== ============================================
|
|
Index Format Accepted Characters
|
|
===== ====== ============================================
|
|
1-3 XXX Any letter including *&* and *Ñ* chars
|
|
4-9 YYMMDD Any valid date
|
|
10-11 XX Any letter or number between 0 and 9
|
|
12 X Any number between 0 and 9 or the letter *A*
|
|
===== ====== ============================================
|
|
|
|
More info about this:
|
|
http://es.wikipedia.org/wiki/Registro_Federal_de_Contribuyentes_(M%C3%A9xico)
|
|
"""
|
|
default_error_messages = {
|
|
'invalid': _('Enter a valid RFC.'),
|
|
'invalid_checksum': _('Invalid checksum for RFC.'),
|
|
}
|
|
|
|
def __init__(self, min_length=9, max_length=13, *args, **kwargs):
|
|
rfc_re = re.compile(ur'^([A-Z&Ññ]{3}|[A-Z][AEIOU][A-Z]{2})%s([A-Z0-9]{2}[0-9A])?$' % DATE_RE,
|
|
re.IGNORECASE)
|
|
super(MXRFCField, self).__init__(rfc_re, min_length=min_length,
|
|
max_length=max_length, *args, **kwargs)
|
|
|
|
def clean(self, value):
|
|
value = super(MXRFCField, self).clean(value)
|
|
if value in EMPTY_VALUES:
|
|
return u''
|
|
value = value.upper()
|
|
if self._has_homoclave(value):
|
|
if not value[-1] == self._checksum(value[:-1]):
|
|
raise ValidationError(self.default_error_messages['invalid_checksum'])
|
|
if self._has_inconvenient_word(value):
|
|
raise ValidationError(self.default_error_messages['invalid'])
|
|
return value
|
|
|
|
def _has_homoclave(self, rfc):
|
|
"""
|
|
This check is done due to the existance of RFCs without a *homoclave*
|
|
since the current algorithm to calculate it had not been created for
|
|
the first RFCs ever in Mexico.
|
|
"""
|
|
rfc_without_homoclave_re = re.compile(ur'^[A-Z&Ññ]{3,4}%s$' % DATE_RE,
|
|
re.IGNORECASE)
|
|
return not rfc_without_homoclave_re.match(rfc)
|
|
|
|
def _checksum(self, rfc):
|
|
"""
|
|
More info about this procedure:
|
|
www.sisi.org.mx/jspsi/documentos/2005/seguimiento/06101/0610100162005_065.doc
|
|
"""
|
|
chars = u'0123456789ABCDEFGHIJKLMN&OPQRSTUVWXYZ-Ñ'
|
|
if len(rfc) == 11:
|
|
rfc = '-' + rfc
|
|
|
|
sum_ = sum(i * chars.index(c) for i, c in zip(reversed(xrange(14)), rfc))
|
|
checksum = 11 - sum_ % 11
|
|
|
|
if checksum == 10:
|
|
return u'A'
|
|
elif checksum == 11:
|
|
return u'0'
|
|
|
|
return unicode(checksum)
|
|
|
|
def _has_inconvenient_word(self, rfc):
|
|
first_four = rfc[:4]
|
|
return first_four in RFC_INCONVENIENT_WORDS
|
|
|
|
|
|
class MXCURPField(RegexField):
|
|
"""
|
|
A field that validates a Mexican Clave Única de Registro de Población.
|
|
|
|
The CURP is integrated by a juxtaposition of characters following the next
|
|
pattern:
|
|
|
|
===== ====== ===================================================
|
|
Index Format Accepted Characters
|
|
===== ====== ===================================================
|
|
1 X Any letter
|
|
2 X Any vowel
|
|
3-4 XX Any letter
|
|
5-10 YYMMDD Any valid date
|
|
11 X Either `H` or `M`, depending on the person's gender
|
|
12-13 XX Any valid acronym for a state in Mexico
|
|
14-16 XXX Any consonant
|
|
17 X Any number between 0 and 9 or any letter
|
|
18 X Any number between 0 and 9
|
|
===== ====== ===================================================
|
|
|
|
More info about this:
|
|
http://www.condusef.gob.mx/index.php/clave-unica-de-registro-de-poblacion-curp
|
|
"""
|
|
default_error_messages = {
|
|
'invalid': _('Enter a valid CURP.'),
|
|
'invalid_checksum': _(u'Invalid checksum for CURP.'),
|
|
}
|
|
|
|
def __init__(self, min_length=18, max_length=18, *args, **kwargs):
|
|
states_re = r'(AS|BC|BS|CC|CL|CM|CS|CH|DF|DG|GT|GR|HG|JC|MC|MN|MS|NT|NL|OC|PL|QT|QR|SP|SL|SR|TC|TS|TL|VZ|YN|ZS|NE)'
|
|
consonants_re = r'[B-DF-HJ-NP-TV-Z]'
|
|
curp_re = (ur'^[A-Z][AEIOU][A-Z]{2}%s[HM]%s%s{3}[0-9A-Z]\d$' %
|
|
(DATE_RE, states_re, consonants_re))
|
|
curp_re = re.compile(curp_re, re.IGNORECASE)
|
|
super(MXCURPField, self).__init__(curp_re, min_length=min_length,
|
|
max_length=max_length, *args, **kwargs)
|
|
|
|
def clean(self, value):
|
|
value = super(MXCURPField, self).clean(value)
|
|
if value in EMPTY_VALUES:
|
|
return u''
|
|
value = value.upper()
|
|
if value[-1] != self._checksum(value[:-1]):
|
|
raise ValidationError(self.default_error_messages['invalid_checksum'])
|
|
if self._has_inconvenient_word(value):
|
|
raise ValidationError(self.default_error_messages['invalid'])
|
|
return value
|
|
|
|
def _checksum(self, value):
|
|
chars = u'0123456789ABCDEFGHIJKLMN&OPQRSTUVWXYZ'
|
|
|
|
s = sum(i * chars.index(c) for i, c in zip(reversed(xrange(19)), value))
|
|
checksum = 10 - s % 10
|
|
|
|
if checksum == 10:
|
|
return u'0'
|
|
return unicode(checksum)
|
|
|
|
def _has_inconvenient_word(self, curp):
|
|
first_four = curp[:4]
|
|
return first_four in CURP_INCONVENIENT_WORDS
|