diff --git a/ngrams/term_frequencies.py b/ngrams/term_frequencies.py index 17fe900..c74d47e 100755 --- a/ngrams/term_frequencies.py +++ b/ngrams/term_frequencies.py @@ -177,7 +177,7 @@ def weekly_tf(partition, subreddit_weeks = groupby(rows, lambda r: (r.subreddit, r.week)) if mwe_pass != 'first': - mwe_dataset = pd.read_feather(f'/gscratch/comdata/output/reddit_ngrams/multiword_expressions.feather') + mwe_dataset = pd.read_feather(f'/gscratch/comdata/output/reddit_ngrams/reddit_multiword_expressions.feather') mwe_dataset = mwe_dataset.sort_values(['phrasePWMI'],ascending=False) mwe_phrases = list(mwe_dataset.phrase) mwe_phrases = [tuple(s.split(' ')) for s in mwe_phrases]