Allow posts schemas to be nullable.
This commit is contained in:
parent
271cbea7d9
commit
88fca0f82b
@@ -126,7 +126,7 @@ def weekly_tf(partition,
|
|||||||
nullable_schema = False
|
nullable_schema = False
|
||||||
elif reddit_dataset == 'posts':
|
elif reddit_dataset == 'posts':
|
||||||
tf_func = tf_posts
|
tf_func = tf_posts
|
||||||
nullable_schema = False
|
nullable_schema = True
|
||||||
|
|
||||||
dataset = ds.dataset(f"{input_parquet}/{partition}", format='parquet')
|
dataset = ds.dataset(f"{input_parquet}/{partition}", format='parquet')
|
||||||
if not os.path.exists(output_10p_sample_path):
|
if not os.path.exists(output_10p_sample_path):
|
||||||
|
Loading…
Reference in New Issue
Block a user