mirror of
https://github.com/rspeer/wordfreq.git
synced 2024-12-23 17:31:41 +00:00
parent
d267e0967c
commit
3446a393c5
@ -9,14 +9,13 @@ CONFIG = {
|
|||||||
# A list of language codes (possibly un-standardized) that we'll
|
# A list of language codes (possibly un-standardized) that we'll
|
||||||
# look up in filenames for these various data sources.
|
# look up in filenames for these various data sources.
|
||||||
'twitter': [
|
'twitter': [
|
||||||
'ar', 'de', 'en', 'es', 'fr', 'id', 'it', 'ja', 'ko', 'ms', 'nl',
|
'ar', 'de', 'el', 'en', 'es', 'fr', 'id', 'it', 'ja', 'ko', 'ms', 'nl',
|
||||||
'pt', 'ru',
|
'pt', 'ru', 'tr'
|
||||||
# can be added later: 'el', 'tr'
|
|
||||||
],
|
],
|
||||||
'wikipedia': [
|
'wikipedia': [
|
||||||
'ar', 'de', 'en', 'es', 'fr', 'id', 'it', 'ja', 'ko', 'ms', 'nl',
|
'ar', 'de', 'en', 'el', 'es', 'fr', 'id', 'it', 'ja', 'ko', 'ms', 'nl',
|
||||||
'pt', 'ru'
|
'pt', 'ru'
|
||||||
# consider adding 'el' and 'tr'
|
# consider adding 'tr'
|
||||||
],
|
],
|
||||||
'opensubtitles': [
|
'opensubtitles': [
|
||||||
# All languages where the most common word in OpenSubtitles
|
# All languages where the most common word in OpenSubtitles
|
||||||
|
Loading…
Reference in New Issue
Block a user