1
0

rename function.

This commit is contained in:
Nathan TeBlunthuis 2024-12-01 13:44:19 -08:00
parent 3fea1f9388
commit 9df9a8b8ff

View File

@@ -239,8 +239,8 @@ def weekly_tf(partition,
writer.close()
author_writer.close()
-def sort_tf_comments(input_parquet="/gscratch/comdata/output/temp_reddit_comments_by_subreddit.parquet/",
-output_parquet="/gscratch/comdata/output/reddit_comments_by_subreddit.parquet/"):
+def sort_tf(input_parquet="/gscratch/comdata/output/temp_reddit_comments_by_subreddit.parquet/",
+output_parquet="/gscratch/comdata/output/reddit_comments_by_subreddit.parquet/"):
from pyspark.sql import functions as f
from pyspark.sql import SparkSession
@@ -274,4 +274,4 @@ def gen_task_list(mwe_pass='first',
if __name__ == "__main__":
fire.Fire({"gen_task_list":gen_task_list,
"weekly_tf":weekly_tf,
-"sort":sort_tf_comments})
+"sort":sort_tf})