X-Git-Url: http://git.tomasm.cz/krypto.git/blobdiff_plain/d7c8d3913bbc5a2119789f1d82c2f3de3f3fa1f3..368fec422dea37982a9577a953efad47c47db524:/ocesavac.py diff --git a/ocesavac.py b/ocesavac.py index 31e49fb..e1d0f59 100644 --- a/ocesavac.py +++ b/ocesavac.py @@ -1,25 +1,29 @@ +"""Modul pro odstranovani diakritiky a zvlastnich znaku.""" import unicodedata ABECEDA = 'ABCDEFGHIJKLMNOPQRSTUVWXYZ' def deaccent(unistr): + """Vrati text bez akcentu. Pochybna metoda pouzivajici unicodedata.""" return ''.join(aChar for aChar in unicodedata.normalize('NFD', unistr) if not unicodedata.combining(aChar)) def ocesat(text, mezery=True): + """Odstrani z textu akcenty, zvlastni znaky nahradi mezerami, posloupnost + mezer jednou mezerou a prevede vsechna pismena na velka.""" text = deaccent(unicode(text)).upper() if mezery: pole = [' '] - lastWh = True - for c in text: - if c in ABECEDA: - pole.append(c) - lastWh = False - elif not lastWh: + last_white = True + for char in text: + if char in ABECEDA: + pole.append(char) + last_white = False + elif not last_white: pole.append(' ') - lastWh = True - if not lastWh: + last_white = True + if not last_white: pole.append(' ') return ''.join(pole) else: # bez mezer