1 files changed, 67 insertions, 0 deletions
diff --git a/translate-toolkit-1.5.1/translate/lang/zh.py b/translate-toolkit-1.5.1/translate/lang/zh.py
new file mode 100644
index 0000000..7f56b0e
--- /dev/null
+++ b/translate-toolkit-1.5.1/translate/lang/zh.py
@@ -0,0 +1,67 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+# 
+# Copyright 2007 Zuza Software Foundation
+# 
+# This file is part of translate.
+#
+# translate is free software; you can redistribute it and/or modify
+# it under the terms of the GNU General Public License as published by
+# the Free Software Foundation; either version 2 of the License, or
+# (at your option) any later version.
+# 
+# translate is distributed in the hope that it will be useful,
+# but WITHOUT ANY WARRANTY; without even the implied warranty of
+# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
+# GNU General Public License for more details.
+#
+# You should have received a copy of the GNU General Public License
+# along with translate; if not, write to the Free Software
+# Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA  02111-1307  USA
+
+"""This module represents Chinese language. (Both tradisional and simplified)
+
+For more information, see U{http://en.wikipedia.org/wiki/Chinese_language}
+"""
+
+from translate.lang import common
+import re
+
+class zh(common.Common):
+    """This class represents Chinese."""
+
+    listseperator = u"、"
+
+    sentenceend = u"。！？…"
+
+    # Compared to common.py, we make the space after the sentence ending 
+    # optional and don't demand an uppercase letter to follow.
+    sentencere = re.compile(r"""(?s)    #make . also match newlines    
+                            .*?         #any text, but match non-greedy
+                            [%s]        #the puntuation for sentence ending
+                            \s*         #the optional space after the puntuation
+                            """ % sentenceend, re.VERBOSE)
+
+    # The following transformation rules should be mostly useful for all types
+    # of Chinese. The comma (,) is not handled here, since it maps to two 
+    # different characters, depending on context.
+    # If comma is used as seperation of sentence, it should be converted to a 
+    # fullwidth comma ("，"). If comma is used as seperation of list items like
+    # "apple, orange, grape, .....", "、" is used.
+    puncdict = {
+        u". ": u"。",
+        u"; ": u"；",
+        u": ": u"：",
+        u"! ": u"！",
+        u"? ": u"？",
+        u".\n": u"。\n",
+        u";\n": u"；\n",
+        u":\n": u"：\n",
+        u"!\n": u"！\n",
+        u"?\n": u"？",
+        u"% ": u"%",
+    }
+
+    length_difference = lambda cls, x: 10 - x/2
+
+    ignoretests = ["startcaps", "simplecaps"]