mirror of
https://github.com/rspeer/wordfreq.git
synced 2024-12-23 09:21:37 +00:00
configuration that builds some larger lists
This commit is contained in:
parent
9907948d11
commit
c1a12cebec
@@ -60,7 +60,8 @@ CONFIG = {
|
||||
'twitter-dist': 'dist/twitter_{lang}.{ext}',
|
||||
'jieba-dist': 'dist/jieba_{lang}.{ext}'
|
||||
},
|
||||
'min_sources': 2
|
||||
'min_sources': 2,
|
||||
'big-lists': ['en', 'fr', 'es', 'pt']
|
||||
}
|
||||
|
||||
|
||||
|
@@ -353,9 +353,11 @@ def combine_lists(languages):
|
||||
params={'lang': language, 'buckets': 600})
|
||||
add_dep(lines, 'freqs2cB', output_file, output_cBpack_big,
|
||||
extra='wordfreq_builder/word_counts.py',
|
||||
params={'lang': language, 'buckets': 900})
|
||||
params={'lang': language, 'buckets': 800})
|
||||
|
||||
lines.append('default {}'.format(output_cBpack))
|
||||
if language in CONFIG['big-lists']:
|
||||
lines.append('default {}'.format(output_cBpack_big))
|
||||
|
||||
# Write standalone lists for Twitter frequency
|
||||
if language in CONFIG['sources']['twitter']:
|
||||
|
Loading…
Reference in New Issue
Block a user