- Author:
- jeanmachuca
- Posted:
- December 16, 2009
- Language:
- Python
- Version:
- 1.1
- Score:
- 0 (after 0 ratings)
This snippet resolves Django-PyAMF unicode problems by calling Django's force_unicode function repeatedly, once for each charset in a configurable tuple, until one of them succeeds.
from django.conf import settings
from django.utils.encoding import DjangoUnicodeDecodeError
import logging
import os.path
# Path of the optional log file: "../log/custom-error.log" relative to the
# directory that contains this module.
LOGFILE = os.path.join(os.path.abspath(os.path.dirname(__file__)), '../log/custom-error.log')

# Configure the root logger once, at import time.
logging.basicConfig(
    level=logging.NOTSET,
    # A plain literal is used on purpose: encoding this ASCII-only text to
    # UTF-8 yields the very same byte string on Python 2, while on Python 3
    # it would produce ``bytes``, which the logging formatter cannot use.
    format='%(asctime)s %(levelname)-8s %(message)s',
    datefmt=u'%m-%d %H:%M',
    # change as needed
    # filename=LOGFILE,
    # filemode only matters once ``filename`` above is enabled.
    filemode='a'
)
# Make sure the root logger itself does not filter out any severity.
logging.getLogger('').setLevel(logging.NOTSET)
def warning(*arg, **kwargs):
    """Log a message with WARNING severity on the root logger.

    All positional and keyword arguments are forwarded unchanged to
    ``logging.warning`` (message, %-format arguments, ``exc_info``, ...).
    """
    # ``logging.warn`` is only a deprecated alias of ``logging.warning`` and
    # no longer exists in recent Python versions, so call the real function.
    logging.warning(*arg, **kwargs)
def desactivateDebug():
    """Turn off DEBUG output by disabling that severity for all loggers."""
    # logging.disable() suppresses records at the given severity and below,
    # regardless of the level configured on individual loggers.
    threshold = logging.DEBUG
    logging.disable(threshold)
def activateDebug():
    """Turn DEBUG output on for the root logger.

    Clears any global ``logging.disable`` threshold and then lowers the root
    logger level to DEBUG.
    """
    # desactivateDebug() works through logging.disable(), which overrides
    # every logger level; without clearing it first, setting the level below
    # would have no visible effect after debugging had been switched off.
    logging.disable(logging.NOTSET)
    logging.getLogger('').setLevel(logging.DEBUG)
class CustomDebug(object):
    """Tiny facade over the module-level debug helpers.

    ``on``/``off`` toggle debug logging and ``write`` emits a message, but
    only while the Django ``DEBUG`` setting is truthy.
    """

    def on(self):
        """Enable debug logging (delegates to ``activateDebug``)."""
        activateDebug()

    def off(self):
        """Disable debug logging (delegates to ``desactivateDebug``)."""
        desactivateDebug()

    def write(self, prnt):
        """Log ``prnt`` through ``warning`` when ``settings.DEBUG`` is set."""
        if not settings.DEBUG:
            return
        warning(prnt)


# Shared instance used by the rest of this module (e.g. TypeManager).
debug = CustomDebug()
class TypeManager(object):
    """Convert values to unicode by trying a configurable list of charsets.

    @author: Jean Machuca (Dec 16, 2009)
    """

    class EncodingError(Exception):
        """Special exception for encoding failures.

        Original author's note: occurs when a non-existent charset is
        present in the input string. Within this file it is raised by
        ``UnicodeFixer.__repr__`` when the conversion fails.
        """

        def __init__(self, *arg, **kwargs):
            super(TypeManager.EncodingError, self).__init__(*arg, **kwargs)

    def force_unicode(self, s, strings_only=False, errors='strict'):
        """Convert ``s`` to unicode using the first charset that works.

        Usage: in your settings.py, define for example::

            AVAILABLE_ENCODINGS = ('ascii', 'utf-8', 'latin-1')

        Each encoding is tried in the order given and the result of the
        first conversion that does not raise a unicode error is returned.
        Order therefore matters: put the strictest charsets first
        ('ascii', then 'utf-8') and permissive ones such as 'latin-1',
        which accepts any byte sequence, last. Further charsets (e.g.
        'utf-16') can be appended to the tuple when needed.

        Parameters:
            s: the value to convert.
            strings_only: forwarded to Django's ``force_unicode``.
            errors: codec error-handling scheme, forwarded to Django's
                ``force_unicode`` (default ``'strict'``).

        Returns:
            The converted value, or ``None`` when
            ``settings.AVAILABLE_ENCODINGS`` is empty or every listed
            encoding failed.
        """
        # Django's helper shares its name with this method and is not
        # imported at module level, so import it here under an alias;
        # otherwise the call below fails with NameError.
        from django.utils.encoding import force_unicode as django_force_unicode

        for encoding in settings.AVAILABLE_ENCODINGS:
            try:
                return django_force_unicode(s, encoding, strings_only, errors)
            # UnicodeEncodeError and UnicodeDecodeError are subclasses of
            # UnicodeError, so they are covered by it.
            except (DjangoUnicodeDecodeError, UnicodeError) as ex:
                debug.write(u'Trying to fix encoding problem: %s' % str(ex))
        # No configured encoding could convert the value.
        return None
class UnicodeFixer(object):
    """Django model mixin that overrides ``__repr__`` for the PyAMF encoding fix.

    @author: Jean Machuca (Dec 16, 2009)

    Usage, in your model::

        class YourNewModel(UnicodeFixer, models.Model):
            ...
    """

    def __repr__(self):
        """Return a sanitized representation built from ``unicode(self)``.

        The unicode form of the instance is passed through
        ``TypeManager.force_unicode`` and then through
        ``encodings.normalize_encoding``.

        Raises:
            TypeManager.EncodingError: if the conversion raises a unicode
                error, or if no configured encoding could convert the value.
        """
        from encodings import normalize_encoding

        try:
            ret = TypeManager().force_unicode(unicode(self))
        # UnicodeEncodeError and UnicodeDecodeError are subclasses of
        # UnicodeError, so a single class covers all three.
        except UnicodeError as ex:
            raise TypeManager.EncodingError(str(ex))

        # TypeManager.force_unicode returns None when every configured
        # encoding failed; report that as an encoding error instead of
        # letting normalize_encoding fail on a non-string value.
        if ret is None:
            raise TypeManager.EncodingError(
                'No encoding in settings.AVAILABLE_ENCODINGS could convert the value')

        # Fix all non-converted characters so the string data dumps correctly.
        # NOTE(review): normalize_encoding is meant for codec *names*; it
        # appears to be used here to squash the text into a plain, safe form.
        # Confirm this output format is what PyAMF consumers expect.
        return normalize_encoding(ret)
|
More like this
- Template tag - list punctuation for a list of items by shapiromatron 10 months, 1 week ago
- JSONRequestMiddleware adds a .json() method to your HttpRequests by cdcarter 10 months, 2 weeks ago
- Serializer factory with Django Rest Framework by julio 1 year, 5 months ago
- Image compression before saving the new model / work with JPG, PNG by Schleidens 1 year, 6 months ago
- Help text hyperlinks by sa2812 1 year, 6 months ago
Comments
Please login first before commenting.