diff --git a/wordfreq_builder/wordfreq_builder/cli/tokenize_reddit.py b/wordfreq_builder/wordfreq_builder/cli/tokenize_reddit.py index c93af67..6a275b3 100644 --- a/wordfreq_builder/wordfreq_builder/cli/tokenize_reddit.py +++ b/wordfreq_builder/wordfreq_builder/cli/tokenize_reddit.py @@ -4,7 +4,7 @@ import argparse def main(): parser = argparse.ArgumentParser() - parser.add_argument('filename', help='filename of input file containing one tweet per line') + parser.add_argument('filename', help='filename of input file containing one comment per line') parser.add_argument('outprefix', help='prefix of output filenames') args = parser.parse_args() tokenize_by_language(args.filename, args.outprefix, tokenizer=cld2_reddit_tokenizer)