wordfreq/tests/test_serbian.py

from nose.tools import eq_
from wordfreq import tokenize


def test_transliteration():
    # The same sentence written in Cyrillic and in Latin script must produce
    # the same lowercase, punctuation-free, Latin-script tokens when it is
    # tokenized with the 'sr' language code.
    #
    # Sentence meaning: "Well, there's a lot of things you do not understand."
    # (from somewhere in OpenSubtitles)
    cyrillic_text = "Па, има ту много ствари које не схваташ."
    latin_text = "Pa, ima tu mnogo stvari koje ne shvataš."
    expected_tokens = [
        'pa', 'ima', 'tu', 'mnogo', 'stvari', 'koje', 'ne', 'shvataš',
    ]

    # Cyrillic is checked first, then Latin, so a failure surfaces on the
    # same input it would have with two separate assertions.
    for sentence in (cyrillic_text, latin_text):
        eq_(tokenize(sentence, 'sr'), expected_tokens)
Add transliteration of Cyrillic Serbian 2016-12-29 23:27:17 +00:00
			`from nose.tools import eq_`
			`from wordfreq import tokenize`


			`def test_transliteration():`
			`# "Well, there's a lot of things you do not understand."`
			`# (from somewhere in OpenSubtitles)`
			`eq_(tokenize("Па, има ту много ствари које не схваташ.", 'sr'),`
			`['pa', 'ima', 'tu', 'mnogo', 'stvari', 'koje', 'ne', 'shvataš'])`
			`eq_(tokenize("Pa, ima tu mnogo stvari koje ne shvataš.", 'sr'),`
			`['pa', 'ima', 'tu', 'mnogo', 'stvari', 'koje', 'ne', 'shvataš'])`