#!/usr/bin/env python # -*- coding: utf-8 -*- from translate.lang import factory def test_punctranslate(): """Tests that we can translate punctuation.""" language = factory.getlanguage('km') assert language.punctranslate(u"abc efg") == u"abc efg" assert language.punctranslate(u"abc efg.") == u"abc efg\u00a0។" print language.punctranslate(u"abc efg. hij.").encode('utf-8') print u"abc efg\u00a0។ hij\u00a0។".encode('utf-8') assert language.punctranslate(u"abc efg. hij.") == u"abc efg\u00a0។ hij\u00a0។" assert language.punctranslate(u"abc efg!") == u"abc efg\u00a0!" assert language.punctranslate(u"abc efg? hij!") == u"abc efg\u00a0? hij\u00a0!" assert language.punctranslate(u"Delete file: %s?") == u"Delete file\u00a0៖ %s\u00a0?" def test_sentences(): """Tests basic functionality of sentence segmentation.""" language = factory.getlanguage('km') sentences = language.sentences(u"លក្ខណៈ​​នេះ​អាច​ឲ្យ​យើងធ្វើ​ជាតូបនីយកម្មកម្មវិធី​កុំព្យូទ័រ​ ។ លក្ខណៈ​​នេះ​អាច​ឲ្យ​យើងធ្វើ​ជាតូបនីយកម្មកម្មវិធី​កុំព្យូទ័រ​ ។") assert sentences == [u"លក្ខណៈ​​នេះ​អាច​ឲ្យ​យើងធ្វើ​ជាតូបនីយកម្មកម្មវិធី​កុំព្យូទ័រ​ ។", u"លក្ខណៈ​​នេះ​អាច​ឲ្យ​យើងធ្វើ​ជាតូបនីយកម្មកម្មវិធី​កុំព្យូទ័រ​ ។"]