mirror of
https://github.com/rspeer/wordfreq.git
synced 2024-12-24 01:41:39 +00:00
f0c7c3a02c
Former-commit-id: 5c8c36f4e3
24 lines
683 B
Python
24 lines
683 B
Python
from nose.tools import eq_, assert_almost_equal
|
|
from wordfreq import tokenize, word_frequency
|
|
|
|
|
|
def test_tokens():
|
|
eq_(tokenize('おはようございます', 'ja'),
|
|
['おはよう', 'ござい', 'ます'])
|
|
|
|
|
|
def test_combination():
|
|
ohayou_freq = word_frequency('おはよう', 'ja')
|
|
gozai_freq = word_frequency('ござい', 'ja')
|
|
masu_freq = word_frequency('ます', 'ja')
|
|
|
|
assert_almost_equal(
|
|
word_frequency('おはようおはよう', 'ja'),
|
|
ohayou_freq / 20
|
|
)
|
|
assert_almost_equal(
|
|
1.0 / word_frequency('おはようございます', 'ja'),
|
|
(100.0 / ohayou_freq + 100.0 / gozai_freq + 100.0 / masu_freq)
|
|
)
|
|
|