bugfix.
This commit is contained in:
parent
78eb16f4d6
commit
587e1c0022
@ -79,7 +79,10 @@ def weekly_tf(partition,
|
|||||||
if os.path.exists(f"{output_10p_sample_path}/{ngram_output}"):
|
if os.path.exists(f"{output_10p_sample_path}/{ngram_output}"):
|
||||||
os.remove(f"{output_10p_sample_path}/{ngram_output}")
|
os.remove(f"{output_10p_sample_path}/{ngram_output}")
|
||||||
|
|
||||||
batches = dataset.to_batches(columns=['CreatedAt','subreddit','body','author'])
|
if reddit_dataset == 'comments':
|
||||||
|
batches = dataset.to_batches(columns=['CreatedAt','subreddit','body','author'])
|
||||||
|
if reddit_dataset == 'posts':
|
||||||
|
batches = dataset.to_batches(columns=['CreatedAt','subreddit','title','author'])
|
||||||
|
|
||||||
schema = pa.schema([pa.field('subreddit', pa.string(), nullable=False),
|
schema = pa.schema([pa.field('subreddit', pa.string(), nullable=False),
|
||||||
pa.field('term', pa.string(), nullable=False),
|
pa.field('term', pa.string(), nullable=False),
|
||||||
|
Loading…
Reference in New Issue
Block a user