mirror of
https://github.com/rspeer/wordfreq.git
synced 2024-12-23 17:31:41 +00:00
disregard Arabic Reddit spam
This commit is contained in:
parent
6feae99381
commit
cfe68893fa
@@ -42,8 +42,7 @@ CONFIG = {
|
|||||||
'subtlex-other': ['de', 'nl', 'zh'],
|
'subtlex-other': ['de', 'nl', 'zh'],
|
||||||
'jieba': ['zh'],
|
'jieba': ['zh'],
|
||||||
'reddit': [
|
'reddit': [
|
||||||
'ar', 'de', 'en', 'es', 'fr', 'it', 'ja', 'pl', 'pt', 'ro',
|
'de', 'en', 'es', 'fr', 'it', 'ja', 'pl', 'pt', 'ro', 'ru', 'sv'
|
||||||
'ru', 'sv'
|
|
||||||
]
|
]
|
||||||
},
|
},
|
||||||
# Subtlex languages that need to be pre-processed
|
# Subtlex languages that need to be pre-processed
|
||||||
|
Loading…
Reference in New Issue
Block a user