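Typo fix: rename the `cols` keyword argument to `col` in the `df.repartition(...)` call inside `_tfidf_wrapper`.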
This commit is contained in:
parent
8b69801c8d
commit
0bbdc6bd5e
@@ -8,7 +8,7 @@ from functools import partial
|
||||
def _tfidf_wrapper(func, inpath, outpath, topN, term_colname, exclude, included_subreddits, included_terms=None, min_df=None, max_df=None):
|
||||
spark = SparkSession.builder.config(map={'spark.executor.memory':'900g','spark.executor.cores':128}).getOrCreate()
|
||||
df = spark.read.parquet(inpath)
|
||||
df = df.repartition(128*15, cols=['subreddit',term_colname])
|
||||
df = df.repartition(128*15, col=['subreddit',term_colname])
|
||||
df = df.filter(~ f.col(term_colname).isin(exclude))
|
||||
|
||||
if included_subreddits is not None:
|
||||
|
Loading…
Reference in New Issue
Block a user