From 638ab7837588ab40b8559f9a3bddb7751c65d1df Mon Sep 17 00:00:00 2001
From: Nathan TeBlunthuis
Date: Thu, 19 Dec 2024 23:32:16 -0800
Subject: [PATCH] comment out config.

---
 similarities/tfidf.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/similarities/tfidf.py b/similarities/tfidf.py
index 23e4104..5fae483 100755
--- a/similarities/tfidf.py
+++ b/similarities/tfidf.py
@@ -6,7 +6,7 @@ from similarities_helper import tfidf_dataset, build_weekly_tfidf_dataset, selec
 from functools import partial
 
 def _tfidf_wrapper(func, inpath, outpath, topN, term_colname, exclude, included_subreddits, included_terms=None, min_df=None, max_df=None):
-    spark = SparkSession.builder.config(map={'spark.executor.memory':'900g','spark.executor.cores':128}).getOrCreate()
+    #spark = SparkSession.builder.config(map={'spark.executor.memory':'900g','spark.executor.cores':128}).getOrCreate()
     df = spark.read.parquet(inpath)
     df = df.repartition(128*15, ['subreddit',term_colname])
     df = df.filter(~ f.col(term_colname).isin(exclude))