From 59363c8c442edd3b1a0c3516ec16ff23a7944947 Mon Sep 17 00:00:00 2001 From: Robyn Speer Date: Tue, 8 Sep 2015 16:15:08 -0400 Subject: [PATCH] update comments in wordfreq_builder.config; remove unused 'version' Former-commit-id: bc323eccaf4188c4cd4d55d8f87fa8e27bc0c6bb --- wordfreq_builder/wordfreq_builder/config.py | 6 ++---- 1 file changed, 2 insertions(+), 4 deletions(-) diff --git a/wordfreq_builder/wordfreq_builder/config.py b/wordfreq_builder/wordfreq_builder/config.py index 00cd695..fd637e8 100644 --- a/wordfreq_builder/wordfreq_builder/config.py +++ b/wordfreq_builder/wordfreq_builder/config.py @@ -1,19 +1,17 @@ import os CONFIG = { - 'version': '1.0b', # data_dir is a relative or absolute path to where the wordlist data # is stored 'data_dir': 'data', 'sources': { - # A list of language codes (possibly un-standardized) that we'll - # look up in filenames for these various data sources. + # A list of language codes that we'll look up in filenames for these + # various data sources. # # Consider adding: # 'th' when we get tokenization for it # 'hi' when we stop messing up its tokenization # 'tl' with one more data source - # 'sv' because its data sources are ready 'twitter': [ 'ar', 'de', 'el', 'en', 'es', 'fr', 'id', 'it', 'ja', 'ko', 'ms', 'nl', 'pl', 'pt', 'ru', 'sv', 'tr'