forgot about Italian

This commit is contained in:
Rob Speer 2015-11-30 18:18:24 -05:00
parent 5ef807117d
commit 8f6cd0e57b

View File

@@ -48,8 +48,8 @@ def cld2_surface_tokenizer(text):
 # Low-frequency languages tend to be detected incorrectly. Keep a limited
 # list of languages we're allowed to use here.
 KEEP_THESE_LANGUAGES = {
-'ar', 'de', 'el', 'en', 'es', 'fr', 'hr', 'id', 'ja', 'ko', 'ms', 'nl',
-'pl', 'pt', 'ro', 'ru', 'sv', 'th'
+'ar', 'de', 'el', 'en', 'es', 'fr', 'hr', 'id', 'it', 'ja', 'ko', 'ms',
+'nl', 'pl', 'pt', 'ro', 'ru', 'sv', 'th'
 }