summaryrefslogtreecommitdiffstats
path: root/pykolab/translit.py
blob: 119675f3b758d3550ebb8f14bc45dfceae15a729 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
# -*- coding: utf-8 -*-
# Copyright 2010-2012 Kolab Systems AG (http://www.kolabsys.com)
#
# Jeroen van Meeuwen (Kolab Systems) <vanmeeuwen a kolabsys.com>
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; version 3 or, at your option, any later version
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
# GNU Library General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
#

import pykolab
from pykolab.translate import _

log = pykolab.getLogger('pykolab.translit')

locale_translit_map = {
        'ru_RU': 'cyrillic'
    }

translit_map = {
        'cyrillic': {
                u'А': 'A',
                u'а': 'a',
                u'Б': 'B',
                u'б': 'b',
                u'В': 'V',
                u'в': 'v',
                u'Г': 'G',
                u'г': 'g',
                u'Д': 'D',
                u'д': 'd',
                u'Е': 'E',
                u'е': 'e',
                u'Ё': 'Yo',
                u'ё': 'e',
                u'Ж': 'Zh',
                u'ж': 'zh',
                u'З': 'Z',
                u'з': 'z',
                u'И': 'I',
                u'и': 'i',
                u'Й': 'J',
                u'й': 'j',
                u'К': 'K',
                u'к': 'k',
                u'Л': 'L',
                u'л': 'l',
                u'М': 'M',
                u'м': 'm',
                u'Н': 'N',
                u'н': 'n',
                u'О': 'O',
                u'о': 'o',
                u'П': 'P',
                u'п': 'p',
                u'Р': 'R',
                u'р': 'r',
                u'С': 'S',
                u'с': 's',
                u'Т': 'T',
                u'т': 't',
                u'У': 'U',
                u'у': 'u',
                u'Ф': 'F',
                u'ф': 'f',
                u'Х': 'Kh',
                u'х': 'kh',
                u'Ц': 'Tc',
                u'ц': 'tc',
                u'Ч': 'Ch',
                u'ч': 'ch',
                u'Ш': 'Sh',
                u'ш': 'sh',
                u'Щ': 'Shch',
                u'щ': 'shch',
                u'Ъ': '',
                u'ъ': '',
                u'Ы': 'Y',
                u'ы': 'y',
                u'Ь': '',
                u'ь': '',
                u'Э': 'E',
                u'э': 'e',
                u'Ю': 'Yu',
                u'ю': 'yu',
                u'Я': 'Ya',
                u'я': 'ya',
            }
    }

def transliterate(_input, lang, _output_expected=None):
    _translit_name = locale_translit_map[lang]

    _output = ''

    for char in _input.decode('utf-8'):
        if translit_map[_translit_name].has_key(char):
            _output += translit_map[_translit_name][char]
        elif char in [repr(x) for x in translit_map[_translit_name].keys()]:
            _output += translit_map[_translit_name][[char in [raw(x) for x in translit_map[_translit_name].keys()]][0]]
        else:
            _output += char

    return _output