Web   ·   Wiki   ·   Activities   ·   Blog   ·   Lists   ·   Chat   ·   Meeting   ·   Bugs   ·   Git   ·   Translate   ·   Archive   ·   People   ·   Donate
summaryrefslogtreecommitdiffstats
path: root/translate-toolkit-1.5.1/translate/lang/zh.py
diff options
context:
space:
mode:
Diffstat (limited to 'translate-toolkit-1.5.1/translate/lang/zh.py')
-rw-r--r--translate-toolkit-1.5.1/translate/lang/zh.py67
1 files changed, 67 insertions, 0 deletions
diff --git a/translate-toolkit-1.5.1/translate/lang/zh.py b/translate-toolkit-1.5.1/translate/lang/zh.py
new file mode 100644
index 0000000..7f56b0e
--- /dev/null
+++ b/translate-toolkit-1.5.1/translate/lang/zh.py
@@ -0,0 +1,67 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+#
+# Copyright 2007 Zuza Software Foundation
+#
+# This file is part of translate.
+#
+# translate is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+#
+# translate is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with translate; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
+
+"""This module represents Chinese language. (Both tradisional and simplified)
+
+For more information, see U{http://en.wikipedia.org/wiki/Chinese_language}
+"""
+
+from translate.lang import common
+import re
+
+class zh(common.Common):
+ """This class represents Chinese."""
+
+ listseperator = u"、"
+
+ sentenceend = u"。!?…"
+
+ # Compared to common.py, we make the space after the sentence ending
+ # optional and don't demand an uppercase letter to follow.
+ sentencere = re.compile(r"""(?s) #make . also match newlines
+ .*? #any text, but match non-greedy
+ [%s] #the puntuation for sentence ending
+ \s* #the optional space after the puntuation
+ """ % sentenceend, re.VERBOSE)
+
+ # The following transformation rules should be mostly useful for all types
+ # of Chinese. The comma (,) is not handled here, since it maps to two
+ # different characters, depending on context.
+ # If comma is used as seperation of sentence, it should be converted to a
+ # fullwidth comma (","). If comma is used as seperation of list items like
+ # "apple, orange, grape, .....", "、" is used.
+ puncdict = {
+ u". ": u"。",
+ u"; ": u";",
+ u": ": u":",
+ u"! ": u"!",
+ u"? ": u"?",
+ u".\n": u"。\n",
+ u";\n": u";\n",
+ u":\n": u":\n",
+ u"!\n": u"!\n",
+ u"?\n": u"?",
+ u"% ": u"%",
+ }
+
+ length_difference = lambda cls, x: 10 - x/2
+
+ ignoretests = ["startcaps", "simplecaps"]