mirror of
https://github.com/rspeer/wordfreq.git
synced 2024-12-23 17:31:41 +00:00
configuration that builds some larger lists
Former-commit-id: c1a12cebec
This commit is contained in:
parent
35ee23591e
commit
3b95d349e0
@@ -60,7 +60,8 @@ CONFIG = {
|
||||
'twitter-dist': 'dist/twitter_{lang}.{ext}',
|
||||
'jieba-dist': 'dist/jieba_{lang}.{ext}'
|
||||
},
|
||||
'min_sources': 2
|
||||
'min_sources': 2,
|
||||
'big-lists': ['en', 'fr', 'es', 'pt']
|
||||
}
|
||||
|
||||
|
||||
|
@@ -353,9 +353,11 @@ def combine_lists(languages):
|
||||
params={'lang': language, 'buckets': 600})
|
||||
add_dep(lines, 'freqs2cB', output_file, output_cBpack_big,
|
||||
extra='wordfreq_builder/word_counts.py',
|
||||
params={'lang': language, 'buckets': 900})
|
||||
params={'lang': language, 'buckets': 800})
|
||||
|
||||
lines.append('default {}'.format(output_cBpack))
|
||||
if language in CONFIG['big-lists']:
|
||||
lines.append('default {}'.format(output_cBpack_big))
|
||||
|
||||
# Write standalone lists for Twitter frequency
|
||||
if language in CONFIG['sources']['twitter']:
|
||||
|
Loading…
Reference in New Issue
Block a user