| Trees | Indices | Help | 
 | 
|---|
|  | 
 1  #!/usr/bin/env python 
 2  # -*- coding: utf-8 -*- 
 3  #  
 4  # Copyright 2007 Zuza Software Foundation 
 5  #  
 6  # This file is part of translate. 
 7  # 
 8  # translate is free software; you can redistribute it and/or modify 
 9  # it under the terms of the GNU General Public License as published by 
10  # the Free Software Foundation; either version 2 of the License, or 
11  # (at your option) any later version. 
12  #  
13  # translate is distributed in the hope that it will be useful, 
14  # but WITHOUT ANY WARRANTY; without even the implied warranty of 
15  # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the 
16  # GNU General Public License for more details. 
17  # 
18  # You should have received a copy of the GNU General Public License 
19  # along with translate; if not, write to the Free Software 
20  # Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA 
21   
22  """This module represents the Chinese language (both traditional and simplified). 
23   
24  For more information, see U{http://en.wikipedia.org/wiki/Chinese_language} 
25  """ 
26   
27  from translate.lang import common 
28  import re 
29   
31      """This class represents Chinese.""" 
32      code = "zh" 
33      fullname = "Chinese" 
34      nplurals = 1 
35      pluralequation = "0" 
36   
37      listseperator = u"、" 
38   
39      sentenceend = u"。!?…" 
40   
41      # Matches one sentence: any text up to a sentence-ending mark plus trailing 
42      # whitespace. Unlike common.py, that whitespace is optional and no uppercase letter need follow. 
43      sentencere = re.compile(r"""(?s)    #make . also match newlines     
44                              .*?         #any text, but match non-greedy 
45                              [%s]        #the puntuation for sentence ending 
46                              \s*         #the optional space after the puntuation 
47                              """ % sentenceend, re.VERBOSE) 
48   
49      # The following transformation rules should be mostly useful for all types 
50      # of Chinese. The comma (,) is not handled here, since it maps to two  
51      # different characters, depending on context. 
52      # If a comma is used to separate clauses of a sentence, it is converted to a 
53      # fullwidth comma ("，"). If a comma is used to separate list items, as in 
54      # "apple, orange, grape, .....", "、" is used. 
55      puncdict = { 
56          u". ": u"。", 
57          u"; ": u";", 
58          u": ": u":", 
59          u"! ": u"!", 
60          u"? ": u"?", 
61          u".\n": u"。\n", 
62          u";\n": u";\n", 
63          u":\n": u":\n", 
64          u"!\n": u"!\n", 
65          u"?\n": u"?", 
66          u"% ": u"%", 
67          u" (": u"(", 
68          u") ": u")", 
69      } 
70   
71      ignoretests = ["startcaps", "simplecaps"]  # NOTE(review): presumably the names of capitalisation checks to skip for Chinese - confirm against the checker
72   
| Trees | Indices | Help | 
 | 
|---|
| Generated by Epydoc 3.0.1 on Wed Mar 26 12:49:42 2008 | http://epydoc.sourceforge.net |