1
0

correct output path.

This commit is contained in:
Nathan TeBlunthuis 2024-12-04 09:07:10 -08:00
parent 85945eae90
commit 472849ebd9

View File

@@ -57,5 +57,5 @@ df = df.select('phrase','phraseCount','phraseLogProb','phrasePWMI')
# #
df = df.filter(f.col('phraseCount') > 3500).filter(f.col("phrasePWMI")>3) df = df.filter(f.col('phraseCount') > 3500).filter(f.col("phrasePWMI")>3)
df = df.toPandas() df = df.toPandas()
df.to_feather("/gscratch/comdata/users/nathante/reddit_multiword_expressions.feather") df.to_feather("/gscratch/comdata/output/reddit_ngrams/reddit_multiword_expressions.feather")
df.to_csv("/gscratch/comdata/users/nathante/reddit_multiword_expressions.csv") df.to_csv("/gscratch/comdata/output/reddit_ngrams/reddit_multiword_expressions.csv")