diff --git a/ngrams/top_comment_phrases.py b/ngrams/top_comment_phrases.py index 09e913b..00fcc9e 100755 --- a/ngrams/top_comment_phrases.py +++ b/ngrams/top_comment_phrases.py @@ -57,5 +57,5 @@ df = df.select('phrase','phraseCount','phraseLogProb','phrasePWMI') # df = df.filter(f.col('phraseCount') > 3500).filter(f.col("phrasePWMI")>3) df = df.toPandas() -df.to_feather("/gscratch/comdata/users/nathante/reddit_multiword_expressions.feather") -df.to_csv("/gscratch/comdata/users/nathante/reddit_multiword_expressions.csv") +df.to_feather("/gscratch/comdata/output/reddit_ngrams/reddit_multiword_expressions.feather") +df.to_csv("/gscratch/comdata/output/reddit_ngrams/reddit_multiword_expressions.csv")