typofix

2024-12-15 08:23:06 -08:00 · 2024-12-15 08:23:06 -08:00 · 52694e0498
commit 52694e0498
parent cb2f2c9717
1 changed file with 1 addition and 1 deletion
--- a/similarities/tfidf.py
+++ b/similarities/tfidf.py
@@ -5,7 +5,7 @@ from pyspark.sql import functions as f
 from similarities_helper import tfidf_dataset, build_weekly_tfidf_dataset, select_topN_subreddits
 from functools import partial

- def _tfidf_wrapper(func, inpath, outpath, topN, term_colname, exclude, included_subreddits, included_terms=None, min_df=None, max_df=None):
+def _tfidf_wrapper(func, inpath, outpath, topN, term_colname, exclude, included_subreddits, included_terms=None, min_df=None, max_df=None):
    spark = SparkSession.builder.config(map={'spark.executor.memory':'900g','spark.executor.cores':128}).getOrCreate()
    df = spark.read.parquet(inpath)