diff --git a/ngrams/term_frequencies.py b/ngrams/term_frequencies.py index c74d47e..0e77682 100755 --- a/ngrams/term_frequencies.py +++ b/ngrams/term_frequencies.py @@ -193,7 +193,7 @@ def weekly_tf(partition, outrows = tf_func(subreddit_weeks, mwe_pass, mwe_tokenize, stopWords, Path(output_10p_sample_path) / ngram_output) - outchunksize = 100000 + outchunksize = 10000 Path(output_terms_path).mkdir(parents=True, exist_ok=True) Path(output_authors_path).mkdir(parents=True, exist_ok=True)